Repository: vipshop/vire
Branch: master
Commit: fdb7db80f875
Files: 174
Total size: 1.6 MB

Directory structure:
gitextract_y_mdrj8b/

├── .gitignore
├── ChangeLog
├── LICENSE
├── Makefile.am
├── NOTICE
├── README.md
├── conf/
│   └── vire.conf
├── configure.ac
├── dep/
│   ├── .gitignore
│   ├── Makefile.am
│   ├── ae/
│   │   ├── Makefile.am
│   │   ├── ae.c
│   │   ├── ae.h
│   │   ├── ae_epoll.c
│   │   ├── ae_evport.c
│   │   ├── ae_kqueue.c
│   │   └── ae_select.c
│   ├── darray/
│   │   ├── Makefile.am
│   │   ├── darray.c
│   │   └── darray.h
│   ├── dhashkit/
│   │   ├── Makefile.am
│   │   ├── dcrc16.c
│   │   ├── dcrc32.c
│   │   ├── dfnv.c
│   │   ├── dhashkit.h
│   │   ├── dhsieh.c
│   │   ├── djenkins.c
│   │   ├── dketama.c
│   │   ├── dmd5.c
│   │   ├── dmodula.c
│   │   ├── dmurmur.c
│   │   ├── done_at_a_time.c
│   │   ├── drandom.c
│   │   └── dsha1.c
│   ├── dlist/
│   │   ├── Makefile.am
│   │   ├── dlist.c
│   │   ├── dlist.h
│   │   ├── dlockqueue.c
│   │   ├── dlockqueue.h
│   │   ├── dmtqueue.c
│   │   └── dmtqueue.h
│   ├── dmalloc/
│   │   ├── Makefile.am
│   │   ├── dmalloc.c
│   │   └── dmalloc.h
│   ├── himemcached-0.1.0/
│   │   ├── Makefile.am
│   │   ├── himcdep/
│   │   │   ├── sds.c
│   │   │   └── sds.h
│   │   ├── himcread.c
│   │   ├── himcread.h
│   │   ├── himemcached.c
│   │   └── himemcached.h
│   ├── hiredis-0.13.3/
│   │   └── .gitignore
│   ├── jemalloc-4.2.0/
│   │   └── .gitignore
│   ├── jemalloc-4.2.0.tar.bz2
│   ├── sds/
│   │   ├── Makefile.am
│   │   ├── sds.c
│   │   ├── sds.h
│   │   └── sdsalloc.h
│   └── util/
│       ├── Makefile.am
│       ├── dlog.c
│       ├── dlog.h
│       ├── dspecialconfig.h
│       ├── dutil.c
│       └── dutil.h
├── m4/
│   └── .gitignore
├── notes/
│   ├── c-styleguide.txt
│   ├── debug.txt
│   └── socket.txt
├── scripts/
│   └── .gitignore
├── src/
│   ├── Makefile.am
│   ├── vr.c
│   ├── vr_aof.c
│   ├── vr_aof.h
│   ├── vr_backend.c
│   ├── vr_backend.h
│   ├── vr_bitops.c
│   ├── vr_bitops.h
│   ├── vr_block.c
│   ├── vr_block.h
│   ├── vr_client.c
│   ├── vr_client.h
│   ├── vr_command.c
│   ├── vr_command.h
│   ├── vr_conf.c
│   ├── vr_conf.h
│   ├── vr_connection.c
│   ├── vr_connection.h
│   ├── vr_core.c
│   ├── vr_core.h
│   ├── vr_db.c
│   ├── vr_db.h
│   ├── vr_dict.c
│   ├── vr_dict.h
│   ├── vr_eventloop.c
│   ├── vr_eventloop.h
│   ├── vr_hyperloglog.c
│   ├── vr_hyperloglog.h
│   ├── vr_intset.c
│   ├── vr_intset.h
│   ├── vr_listen.c
│   ├── vr_listen.h
│   ├── vr_lzf.h
│   ├── vr_lzfP.h
│   ├── vr_lzf_c.c
│   ├── vr_lzf_d.c
│   ├── vr_master.c
│   ├── vr_master.h
│   ├── vr_multi.c
│   ├── vr_multi.h
│   ├── vr_notify.c
│   ├── vr_notify.h
│   ├── vr_object.c
│   ├── vr_object.h
│   ├── vr_pubsub.c
│   ├── vr_pubsub.h
│   ├── vr_quicklist.c
│   ├── vr_quicklist.h
│   ├── vr_rbtree.c
│   ├── vr_rbtree.h
│   ├── vr_rdb.c
│   ├── vr_rdb.h
│   ├── vr_replication.c
│   ├── vr_replication.h
│   ├── vr_scripting.c
│   ├── vr_scripting.h
│   ├── vr_server.c
│   ├── vr_server.h
│   ├── vr_signal.c
│   ├── vr_signal.h
│   ├── vr_slowlog.c
│   ├── vr_slowlog.h
│   ├── vr_stats.c
│   ├── vr_stats.h
│   ├── vr_t_hash.c
│   ├── vr_t_hash.h
│   ├── vr_t_list.c
│   ├── vr_t_list.h
│   ├── vr_t_set.c
│   ├── vr_t_set.h
│   ├── vr_t_string.c
│   ├── vr_t_string.h
│   ├── vr_t_zset.c
│   ├── vr_t_zset.h
│   ├── vr_thread.c
│   ├── vr_thread.h
│   ├── vr_util.c
│   ├── vr_util.h
│   ├── vr_worker.c
│   ├── vr_worker.h
│   ├── vr_ziplist.c
│   ├── vr_ziplist.h
│   ├── vr_zipmap.c
│   └── vr_zipmap.h
├── tests/
│   ├── .gitignore
│   ├── Makefile.am
│   ├── vrabtest.c
│   ├── vrabtest.h
│   ├── vrt_backend.c
│   ├── vrt_backend.h
│   ├── vrt_benchmark.c
│   ├── vrt_check_data.c
│   ├── vrt_check_data.h
│   ├── vrt_dispatch_data.c
│   ├── vrt_dispatch_data.h
│   ├── vrt_produce_data.c
│   ├── vrt_produce_data.h
│   ├── vrt_public.c
│   ├── vrt_public.h
│   ├── vrt_simple.c
│   ├── vrt_simple.h
│   ├── vrt_util.c
│   ├── vrt_util.h
│   └── vrtest.c
└── tools/
    └── .gitignore

================================================
FILE CONTENTS
================================================

================================================
FILE: .gitignore
================================================
# pyc
*.pyc

# Compiled Object files
*.lo
*.o

# Compiled Dynamic libraries
*.so

# Compiled Static libraries
*.la
*.a

# Compiled misc
*.dep
*.gcda
*.gcno
*.gcov

# Packages
*.tar.gz
*.tar.bz2

# Logs
*.log

# vire
*.swp
*.~
*.project
*.cproject

# Core and executable
core*
vire

# extracted jemalloc
!/dep/jemalloc-*

# Autotools
.deps
.libs

/aclocal.m4
/autom4te.cache
/stamp-h1
/autoscan.log
/libtool

/config/config.guess
/config/config.sub
/config/depcomp
/config/install-sh
/config/ltmain.sh
/config/missing
/config

/config.h
/config.h.in
/config.h.in~
/config.log
/config.status
/configure.scan
/configure

Makefile
Makefile.in


================================================
FILE: ChangeLog
================================================
 2016-10-25  deep011  <diguo58@gmail.com>
    * vire: version 1.0.0 release
      vire (pronounced "vip-redis") is a multithreaded redis (based on redis-3.2.0) maintained by vipshop.
      multi-threads support.
      command type CONNECTION supported: ping,quit,echo,select,auth,admin.
      command type SERVER supported: info,flushall,flushdb,time,dbsize,command,config,client,slowlog.
      command type KEY supported: del,exists,ttl,pttl,expire,expireat,pexpire,pexpireat,persist,randomkey,type,keys,scan,object.
      command type STRING supported: get,set,setnx,setex,psetex,incr,decr,incrby,decrby,append,strlen,getset,incrbyfloat,setbit,getbit,setrange,getrange,bitcount,bitpos,mget,mset.
      command type HASH supported: hset,hget,hlen,hdel,hexists,hkeys,hvals,hgetall,hincrby,hincrbyfloat,hmget,hmset,hsetnx,hstrlen,hscan.
      command type LIST supported: rpush,lpush,lrange,rpop,lpop,llen,lrem,ltrim,lindex,lset.
      command type SET supported: sadd,smembers,scard,srem,spop,sismember,sscan,sunion,sunionstore,sdiff,sdiffstore,sinter,sinterstore.
      command type SORTEDSET supported: zadd,zincrby,zrange,zrevrange,zrem,zcard,zcount,zrangebyscore,zrevrangebyscore,zrank,zrevrank,zscore,zremrangebyscore,zremrangebyrank,zremrangebylex,zscan.
      command type HYPERLOGLOG supported: pfadd,pfcount.
      config option added(used for config file and 'config get/set' command): port,databases,internal-dbs-per-databases,requirepass,adminpass,commands-need-adminpass,maxclients,maxmemory,maxmemory-policy,maxmemory-samples,max-time-complexity-limit,slowlog-log-slower-than,slowlog-max-len.
      viretest added for unit testing.
      vireabtest added for comparing command execution and data consistency with redis-3.2.0.
      vire-benchmark added; it is adapted from redis-benchmark, supports multiple threads, and is used to stress-test vire.

================================================
FILE: LICENSE
================================================

                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      "License" shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      "Licensor" shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      "Legal Entity" shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      "control" means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      "You" (or "Your") shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      "Source" form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      "Object" form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      "Work" shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      "Derivative Works" shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      "Contribution" shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, "submitted"
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as "Not a Contribution."

      "Contributor" shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a "NOTICE" text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an "AS IS" BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

================================================
FILE: Makefile.am
================================================
MAINTAINERCLEANFILES = Makefile.in aclocal.m4 configure config.h.in config.h.in~ stamp-h.in

ACLOCAL_AMFLAGS = -I m4

SUBDIRS = dep src tests

EXTRA_DIST = README.md NOTICE LICENSE ChangeLog conf scripts notes


================================================
FILE: NOTICE
================================================


================================================
FILE: README.md
================================================
# vire

**vire** (pronounced "vip-redis") is a multithreaded Redis (based on redis-3.2.0) maintained by vipshop.

### QQ交流群：276406429

## Dependence

Please install automake, libtool, autoconf and bzip2 first.

## Build

To build vire from source with _debug logs enabled_ and _assertions enabled_:

    $ git clone  https://github.com/vipshop/vire.git
    $ cd vire
    $ autoreconf -fvi
    $ ./configure --enable-debug=full
    $ make
    $ src/vire -h

A quick checklist:

+ Use newer version of gcc (older version of gcc has problems)
+ Use CFLAGS="-O1" ./configure && make
+ Use CFLAGS="-O3 -fno-strict-aliasing" ./configure && make
+ `autoreconf -fvi && ./configure` needs `automake` and `libtool` to be installed

## Run

    $ src/vire -c conf/vire.conf -o log -T 6 -d

## Features

+ Multithread.
+ Fast.
+ Works with Linux, *BSD, OS X and SmartOS (Solaris)

## Help

    Usage: vire [-?hVdt] [-v verbosity level] [-o output file]
                [-c conf file] [-p pid file]
                [-T worker threads number]
    
    Options:
    -h, --help             : this help
    -V, --version          : show version and exit
    -t, --test-conf        : test configuration for syntax errors and exit
    -d, --daemonize        : run as a daemon
    -v, --verbose=N        : set logging level (default: 5, min: 0, max: 11)
    -o, --output=S         : set logging file (default: stderr)
    -c, --conf-file=S      : set configuration file (default: conf/vire.conf)
    -p, --pid-file=S       : set pid file (default: off)
    -T, --thread_num=N     : set the worker threads number (default: 6)

## Supported Redis commands so far

#### Connection

+ ping
+ quit
+ echo
+ select
+ auth
+ admin

#### Server

+ info
+ flushall
+ flushdb
+ time
+ dbsize
+ command
+ config
+ client
+ slowlog

#### Key

+ del
+ exists
+ ttl
+ pttl
+ expire
+ expireat
+ pexpire
+ pexpireat
+ persist
+ randomkey
+ type
+ keys
+ scan
+ object

#### String

+ get
+ set
+ setnx
+ setex
+ psetex
+ incr
+ decr
+ incrby
+ decrby
+ append
+ strlen
+ getset
+ incrbyfloat
+ setbit
+ getbit
+ setrange
+ getrange
+ bitcount
+ bitpos
+ mget
+ mset

#### Hash

+ hset
+ hget
+ hlen
+ hdel
+ hexists
+ hkeys
+ hvals
+ hgetall
+ hincrby
+ hincrbyfloat
+ hmget
+ hmset
+ hsetnx
+ hstrlen
+ hscan

#### List

+ rpush
+ lpush
+ lrange
+ rpop
+ lpop
+ llen
+ lrem
+ ltrim
+ lindex
+ lset

#### Set

+ sadd
+ smembers
+ scard
+ srem
+ spop
+ sismember
+ sscan
+ sunion
+ sunionstore
+ sdiff
+ sdiffstore
+ sinter
+ sinterstore

#### SortedSet

+ zadd
+ zincrby
+ zrange
+ zrevrange
+ zrem
+ zcard
+ zcount
+ zrangebyscore
+ zrevrangebyscore
+ zrank
+ zrevrank
+ zscore
+ zremrangebyscore
+ zremrangebyrank
+ zremrangebylex
+ zscan

#### HyperLogLog

+ pfadd
+ pfcount

## License

Copyright © 2016 VIPSHOP Inc.

Licensed under the Apache License, Version 2.0: http://www.apache.org/licenses/LICENSE-2.0


================================================
FILE: conf/vire.conf
================================================
################################## NETWORK #####################################

# By default, if no "bind" configuration directive is specified, Vire listens
# for connections from all the network interfaces available on the server.
# It is possible to listen to just one or multiple selected interfaces using
# the "bind" configuration directive, followed by one or more IP addresses.
#
# Examples:
#
# bind 192.168.1.100 10.0.0.1
# bind 127.0.0.1 ::1
#
# ~~~ WARNING ~~~ If the computer running Vire is directly exposed to the
# internet, binding to all the interfaces is dangerous and will expose the
# instance to everybody on the internet. In that case, uncomment the
# following bind directive, which forces Vire to listen only on
# the IPv4 loopback interface address (this means Vire will be able to
# accept connections only from clients running on the same computer it
# is running on).
#
# IF YOU ARE SURE YOU WANT YOUR INSTANCE TO LISTEN TO ALL THE INTERFACES
# JUST LEAVE THE FOLLOWING LINE COMMENTED OUT.
# ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
# bind 127.0.0.1

# Accept connections on the specified port, default is 55555.
# If port 0 is specified Vire will not listen on a TCP socket.
port 55555

################################# GENERAL #####################################

# Set the number of databases. The default database is DB 0, you can select
# a different one on a per-connection basis using SELECT <dbid> where
# dbid is a number between 0 and 'databases'-1
databases 6

# Set the number of internal dbs for every database. This is used so that
# multiple threads avoid too much lock contention.
internal-dbs-per-databases 6

################################## SECURITY ###################################

# Require clients to issue AUTH <PASSWORD> before processing any other
# commands.  This might be useful in environments in which you do not trust
# others with access to the host running redis-server.
#
# This should stay commented out for backward compatibility and because most
# people do not need auth (e.g. they run their own servers).
#
# Warning: since Redis is pretty fast an outside user can try up to
# 150k passwords per second against a good box. This means that you should
# use a very strong password otherwise it will be very easy to break.
#
# requirepass foobared

# Require clients to issue ADMIN <PASSWORD> before processing any
# commands that need admin rights. This might be useful to prevent users from
# doing some dangerous actions to the host running Vire.
#
# This should stay commented out for backward compatibility and because most
# people do not need auth (e.g. they run their own servers).
#
# Warning: since Redis is pretty fast an outside user can try up to
# 150k passwords per second against a good box. This means that you should
# use a very strong password otherwise it will be very easy to break.
#
# adminpass iamadmin

# Make some commands need adminpass to execute. Those commands may only be
# executed by an administrator. This might be useful to prevent users from
# doing some dangerous actions to the host running Vire.
#
# commands-need-adminpass flushall flushdb keys config

################################### CLIENTS ####################################

# Set the max number of connected clients at the same time. By default
# this limit is set to 10000 clients, however if the Redis server is not
# able to configure the process file limit to allow for the specified limit
# the max number of allowed clients is set to the current file limit
# minus 32 (as Redis reserves a few file descriptors for internal uses).
#
# Once the limit is reached Redis will close all the new connections sending
# an error 'max number of clients reached'.
#
# maxclients 10000

############################## MEMORY MANAGEMENT ################################

# Don't use more memory than the specified amount of bytes.
# When the memory limit is reached Vire will try to remove keys
# according to the eviction policy selected (see maxmemory-policy).
#
# If Vire can't remove keys according to the policy, or if the policy is
# set to 'noeviction', Vire will start to reply with errors to commands
# that would use more memory, like SET, LPUSH, and so on, and will continue
# to reply to read-only commands like GET.
#
# This option is usually useful when using Vire as an LRU cache, or to set
# a hard memory limit for an instance (using the 'noeviction' policy).
#
# WARNING: If you have slaves attached to an instance with maxmemory on,
# the size of the output buffers needed to feed the slaves are subtracted
# from the used memory count, so that network problems / resyncs will
# not trigger a loop where keys are evicted, and in turn the output
# buffer of slaves is full with DELs of keys evicted triggering the deletion
# of more keys, and so forth until the database is completely emptied.
#
# In short... if you have slaves attached it is suggested that you set a lower
# limit for maxmemory so that there is some free RAM on the system for slave
# output buffers (but this is not needed if the policy is 'noeviction').
#
# maxmemory <bytes>

# MAXMEMORY POLICY: how Vire will select what to remove when maxmemory
# is reached. You can select among the following behaviors:
#
# volatile-lru -> remove the key with an expire set using an LRU algorithm, not supported yet
# allkeys-lru -> remove any key according to the LRU algorithm, not supported yet
# volatile-random -> remove a random key with an expire set
# allkeys-random -> remove a random key, any key
# volatile-ttl -> remove the key with the nearest expire time (minor TTL)
# noeviction -> don't expire at all, just return an error on write operations
#
# Note: with any of the above policies, Vire will return an error on write
#       operations, when there are no suitable keys for eviction.
#
#       At the date of writing these commands are: set setnx setex append
#       incr decr rpush lpush rpushx lpushx linsert lset rpoplpush sadd
#       sinter sinterstore sunion sunionstore sdiff sdiffstore zadd zincrby
#       zunionstore zinterstore hset hsetnx hmset hincrby incrby decrby
#       getset mset msetnx exec sort
#
# The default is:
#
# maxmemory-policy noeviction

# LRU and minimal TTL algorithms are not precise algorithms but approximated
# algorithms (in order to save memory), so you can tune them for speed or
# accuracy. By default Vire will check five keys and pick the one that was
# used less recently; you can change the sample size using the following
# configuration directive.
#
# The default of 5 produces good enough results. 10 Approximates very closely
# true LRU but costs a bit more CPU. 3 is very fast but not very accurate.
#
# maxmemory-samples 5

# Max time complexity limit for the commands that their time complexity is O(n).
#
# If n is bigger than max-time-complexity-limit, an error is returned for the client.
# The default of 0 means unlimited.
#
#       At the date of writing the affected commands are: keys
# 
# max-time-complexity-limit 0

################################## SLOW LOG ###################################

# The Vire Slow Log is a system to log queries that exceeded a specified
# execution time. The execution time does not include the I/O operations
# like talking with the client, sending the reply and so forth,
# but just the time needed to actually execute the command (this is the only
# stage of command execution where the thread is blocked and can not serve
# other requests in the meantime).
#
# You can configure the slow log with two parameters: one tells Vire
# what is the execution time, in microseconds, to exceed in order for the
# command to get logged, and the other parameter is the length of the
# slow log. When a new command is logged the oldest one is removed from the
# queue of logged commands.

# The following time is expressed in microseconds, so 1000000 is equivalent
# to one second. Note that a negative number disables the slow log, while
# a value of zero forces the logging of every command.
slowlog-log-slower-than 10000

# There is no limit to this length. Just be aware that it will consume memory.
# You can reclaim memory used by the slow log with SLOWLOG RESET.
slowlog-max-len 128

================================================
FILE: configure.ac
================================================
# Define the package version numbers and the bug reporting address
m4_define([VR_MAJOR], 1)
m4_define([VR_MINOR], 0)
m4_define([VR_PATCH], 0)
m4_define([VR_BUGS], [diguo58@gmail.com])

# Initialize autoconf
AC_PREREQ([2.63])
AC_INIT([vire], [VR_MAJOR.VR_MINOR.VR_PATCH], [VR_BUGS])
AC_CONFIG_SRCDIR([src/vr.c])
AC_CONFIG_AUX_DIR([config])
AC_CONFIG_HEADERS([config.h:config.h.in])
AC_CONFIG_MACRO_DIR([m4])

# Initialize automake
AM_INIT_AUTOMAKE([1.9 foreign])

# Define macro variables for the package version numbers
AC_DEFINE(VR_VERSION_MAJOR, VR_MAJOR, [Define the major version number])
AC_DEFINE(VR_VERSION_MINOR, VR_MINOR, [Define the minor version number])
AC_DEFINE(VR_VERSION_PATCH, VR_PATCH, [Define the patch version number])
AC_DEFINE(VR_VERSION_STRING, "VR_MAJOR.VR_MINOR.VR_PATCH", [Define the version string])

# Checks for language
AC_LANG([C])

# Checks for programs
AC_PROG_AWK
AC_PROG_CC
AC_PROG_CPP
AC_PROG_CXX
AC_PROG_INSTALL
AC_PROG_LN_S
AC_PROG_MAKE_SET
AC_PROG_RANLIB
AC_PROG_LIBTOOL

# Checks for typedefs, structures, and compiler characteristics
AC_C_INLINE
AC_TYPE_INT8_T
AC_TYPE_INT16_T
AC_TYPE_INT32_T
AC_TYPE_INT64_T
AC_TYPE_INTMAX_T
AC_TYPE_INTPTR_T
AC_TYPE_UINT8_T
AC_TYPE_UINT16_T
AC_TYPE_UINT32_T
AC_TYPE_UINT64_T
AC_TYPE_UINTMAX_T
AC_TYPE_UINTPTR_T
AC_TYPE_OFF_T
AC_TYPE_PID_T
AC_TYPE_SIZE_T
AC_TYPE_SSIZE_T

# Determine the host byte order.  The big-endian action is left empty here,
# little-endian hosts get HAVE_LITTLE_ENDIAN defined, and an unknown or
# universal byte order aborts configure with an error.
AC_C_BIGENDIAN(
  [],
  [AC_DEFINE(HAVE_LITTLE_ENDIAN, 1, [Define to 1 if machine is little endian])],
  [AC_MSG_ERROR([endianness of this machine is unknown])],
  [AC_MSG_ERROR([universal endianness not supported])]
)

# Checks for header files
AC_HEADER_STDBOOL
AC_CHECK_HEADERS([fcntl.h float.h limits.h stddef.h stdlib.h string.h unistd.h])
AC_CHECK_HEADERS([inttypes.h stdint.h])
AC_CHECK_HEADERS([sys/ioctl.h sys/time.h sys/uio.h])
AC_CHECK_HEADERS([sys/socket.h sys/un.h netinet/in.h arpa/inet.h netdb.h])
AC_CHECK_HEADERS([execinfo.h],
  [AC_DEFINE(HAVE_BACKTRACE, [1], [Define to 1 if backtrace is supported])], [])
AC_CHECK_HEADERS([sys/epoll.h], [], [])
AC_CHECK_HEADERS([sys/event.h], [], [])

# Checks for libraries
AC_CHECK_LIB([m], [pow])
AC_CHECK_LIB([pthread], [pthread_create])

# Checks for library functions
AC_FUNC_FORK
AC_FUNC_MALLOC
AC_FUNC_REALLOC
AC_CHECK_FUNCS([dup2 gethostname gettimeofday strerror])
AC_CHECK_FUNCS([socket])
AC_CHECK_FUNCS([memchr memmove memset])
AC_CHECK_FUNCS([strchr strndup strtoul])

# Probe for a working epoll: compile and run a small program that calls
# epoll_create and exits 0 on success or 1 on failure.  The outcome is cached
# in ac_cv_epoll_works, and HAVE_EPOLL is defined when the result is yes.
AC_CACHE_CHECK([if epoll works], [ac_cv_epoll_works],
  AC_TRY_RUN([
#include <stdio.h>
#include <stdlib.h>
#include <sys/epoll.h>
int
main(int argc, char **argv)
{
    int fd;

    fd = epoll_create(256);
    if (fd < 0) {
        perror("epoll_create:");
        exit(1);
    }
    exit(0);
}
  ], [ac_cv_epoll_works=yes], [ac_cv_epoll_works=no]))
AS_IF([test "x$ac_cv_epoll_works" = "xyes"],
  [AC_DEFINE([HAVE_EPOLL], [1], [Define to 1 if epoll is supported])], [])

# Probe for a working kqueue: compile and run a small program that calls
# kqueue and exits 0 on success or 1 on failure.  The outcome is cached in
# ac_cv_kqueue_works, and HAVE_KQUEUE is defined when the result is yes.
AC_CACHE_CHECK([if kqueue works], [ac_cv_kqueue_works],
  AC_TRY_RUN([
#include <stdio.h>
#include <stdlib.h>
#include <sys/types.h>
#include <sys/event.h>
#include <sys/time.h>
int
main(int argc, char **argv)
{
    int fd;

    fd = kqueue();
    if (fd < 0) {
        perror("kqueue:");
        exit(1);
    }
    exit(0);
}
  ], [ac_cv_kqueue_works=yes], [ac_cv_kqueue_works=no]))
AS_IF([test "x$ac_cv_kqueue_works" = "xyes"],
  [AC_DEFINE([HAVE_KQUEUE], [1], [Define to 1 if kqueue is supported])], [])

# Probe event ports: the test program must be able to create a port.
# HAVE_EVENT_PORTS is defined when the cached result is yes.
AC_CACHE_CHECK([if event ports works], [ac_cv_evports_works],
  AC_TRY_RUN([
#include <stdio.h>
#include <stdlib.h>
#include <port.h>
int
main(int argc, char **argv)
{
    int fd;

    fd = port_create();
    if (fd < 0) {
        perror("port_create:");
        exit(1);
    }
    exit(0);
}
  ], [ac_cv_evports_works=yes], [ac_cv_evports_works=no]))
AS_IF([test "x$ac_cv_evports_works" = "xyes"],
  [AC_DEFINE([HAVE_EVENT_PORTS], [1], [Define to 1 if event ports is supported])], [])

# Stop configure when none of the three probed event mechanisms works.
AS_IF([test "x$ac_cv_epoll_works" = "xno" &&
       test "x$ac_cv_kqueue_works" = "xno" &&
       test "x$ac_cv_evports_works" = "xno"],
  [AC_MSG_ERROR([either epoll or kqueue or event ports support is required])], [])

# Automake conditionals. The first three follow the results of the event
# mechanism probes; the last two match the beginning of the uname -v string.
# String equality is spelled "=" because that is the only form test(1) is
# required to support; "==" is rejected by shells such as dash.
AM_CONDITIONAL([OS_LINUX], [test "x$ac_cv_epoll_works" = "xyes"])
AM_CONDITIONAL([OS_BSD], [test "x$ac_cv_kqueue_works" = "xyes"])
AM_CONDITIONAL([OS_SOLARIS], [test "x$ac_cv_evports_works" = "xyes"])
AM_CONDITIONAL([OS_FREEBSD], [test "$(uname -v | cut -c 1-10)" = "FreeBSD 10"])
AM_CONDITIONAL([OS_DARWIN], [test "$(uname -v | cut -c 1-6)" = "Darwin"])

# Package options

# Debug level selection (default: no):
#   full - HAVE_ASSERT_PANIC and HAVE_DEBUG_LOG are defined
#   yes  - HAVE_ASSERT_LOG and HAVE_DEBUG_LOG are defined
#   log  - only HAVE_DEBUG_LOG is defined
#   no   - nothing is defined
# Any other value makes configure fail.
AC_MSG_CHECKING([whether to enable debug logs and asserts])
AC_ARG_ENABLE([debug],
  [AS_HELP_STRING(
    [--enable-debug=@<:@full|yes|log|no@:>@],
    [enable debug logs and asserts @<:@default=no@:>@])
  ],
  [],
  [enable_debug=no])
AS_CASE([x$enable_debug],
  [xfull], [AC_DEFINE([HAVE_ASSERT_PANIC], [1],
                      [Define to 1 if panic on an assert is enabled])
            AC_DEFINE([HAVE_DEBUG_LOG], [1], [Define to 1 if debug log is enabled])
           ],
  [xyes], [AC_DEFINE([HAVE_ASSERT_LOG], [1],
                     [Define to 1 if log on an assert is enabled])
           AC_DEFINE([HAVE_DEBUG_LOG], [1], [Define to 1 if debug log is enabled])
          ],
  [xlog], [AC_DEFINE([HAVE_DEBUG_LOG], [1], [Define to 1 if debug log is enabled])],
  [xno], [],
  [AC_MSG_FAILURE([invalid value ${enable_debug} for --enable-debug])])
AC_MSG_RESULT($enable_debug)

# Spinlocks are on by default (HAVE_SPINLOCK is defined) and are turned off by
# --disable-spinlock, which is the same as --enable-spinlock=no.
# The action-if-given branch also runs for a plain --enable-spinlock, so the
# decision is taken from the value the user passed instead of being assumed.
AC_MSG_CHECKING([whether to disable spinlock])
AC_ARG_ENABLE([spinlock],
  [AS_HELP_STRING(
    [--disable-spinlock],
    [disable spinlock])
  ],
  [AS_IF([test "x$enableval" = xno],
     [disable_spinlock=yes],
     [disable_spinlock=no])],
  [disable_spinlock=no])
AS_IF([test "x$disable_spinlock" = xyes],
  [],
  [AC_DEFINE([HAVE_SPINLOCK], [1], [Define to 1 if spinlock is not disabled])])
AC_MSG_RESULT($disable_spinlock)

# jemalloc is used unless --with-jemalloc=no (or --without-jemalloc) is given;
# any other value, and the absence of the option, selects it. HAVE_JEMALLOC is
# defined when it is selected.
AC_MSG_CHECKING([whether to use jemalloc])
AC_ARG_WITH([jemalloc],
  AS_HELP_STRING([--with-jemalloc@<:@=yes|no@:>@],
    [use jemalloc(default use jemalloc)]),
  [
    if test "$withval" = "no"; then
      enable_jemalloc=no
    else
	  enable_jemalloc=yes
    fi
  ],
  [enable_jemalloc=yes])
AS_IF([test "x$enable_jemalloc" = xyes],
  [AC_DEFINE([HAVE_JEMALLOC], [1], [Define to 1 if jemalloc is used])],
  [])
AC_MSG_RESULT($enable_jemalloc)

# The commands below are queued to run right before config.status is created.
# They are appended to one shell sequence, so each "cd" affects the commands
# that follow it.
#
# Remove any previous dep/jemalloc-4.2.0 tree, unpack the bundled tarball
# again and run the jemalloc configure script with the je_ symbol prefix.
# NOTE(review): this runs regardless of the jemalloc option chosen above and
# no command result is checked - confirm that is intended.
AC_CONFIG_COMMANDS_PRE([rm -rf dep/jemalloc-4.2.0])
AC_CONFIG_COMMANDS_PRE([mkdir dep/jemalloc-4.2.0])
AC_CONFIG_COMMANDS_PRE([tar xvjf dep/jemalloc-4.2.0.tar.bz2 -C dep])
AC_CONFIG_COMMANDS_PRE([cd dep/jemalloc-4.2.0])
AC_CONFIG_COMMANDS_PRE([./configure --with-jemalloc-prefix=je_])
AC_CONFIG_COMMANDS_PRE([cd ../..])

# Same for hiredis: remove the old tree and unpack dep/hiredis-0.13.3.tar.gz.
# Nothing is executed inside the hiredis directory; the two "cd" commands
# only enter it and come back.
AC_CONFIG_COMMANDS_PRE([rm -rf dep/hiredis-0.13.3])
AC_CONFIG_COMMANDS_PRE([mkdir dep/hiredis-0.13.3])
AC_CONFIG_COMMANDS_PRE([tar zxvf dep/hiredis-0.13.3.tar.gz -C dep])
AC_CONFIG_COMMANDS_PRE([cd dep/hiredis-0.13.3])
AC_CONFIG_COMMANDS_PRE([cd ../..])

# Define Makefiles
# Every Makefile listed here is generated from the Makefile.in of the same
# directory.
AC_CONFIG_FILES([Makefile
                 dep/Makefile
                 dep/util/Makefile
                 dep/dhashkit/Makefile
                 dep/dmalloc/Makefile
                 dep/sds/Makefile
                 dep/ae/Makefile
                 dep/dlist/Makefile
                 dep/darray/Makefile
                 dep/himemcached-0.1.0/Makefile
                 src/Makefile
                 tests/Makefile])

# Generate the "configure" script
AC_OUTPUT


================================================
FILE: dep/.gitignore
================================================
!*.tar.gz

================================================
FILE: dep/Makefile.am
================================================
# Dependency directories that make descends into, in the order listed.
SUBDIRS = jemalloc-4.2.0 hiredis-0.13.3 himemcached-0.1.0 util dhashkit dmalloc ae sds dlist darray

# Third-party source tarballs shipped with the distribution.
EXTRA_DIST = jemalloc-4.2.0.tar.bz2 hiredis-0.13.3.tar.gz


================================================
FILE: dep/ae/Makefile.am
================================================
MAINTAINERCLEANFILES = Makefile.in

# _GNU_SOURCE is requested everywhere except on Solaris builds.
AM_CPPFLAGS =
if !OS_SOLARIS
AM_CPPFLAGS += -D_GNU_SOURCE
endif
AM_CPPFLAGS += -I $(top_srcdir)/dep/util
AM_CPPFLAGS += -I $(top_srcdir)/dep/jemalloc-4.2.0/include
AM_CPPFLAGS += -I $(top_srcdir)/dep/dmalloc

AM_CFLAGS = -Wall -Wshadow
AM_CFLAGS += -Wno-unused-parameter -Wno-unused-value

noinst_LIBRARIES = libae.a

noinst_HEADERS = ae.h

libae_a_SOURCES =	\
	ae.c ae.h

# ae.c pulls in exactly one of these backends with #include, so they are
# never compiled on their own and are not sources of the library. They are
# listed here so that "make dist" still ships them.
EXTRA_DIST = ae_epoll.c ae_evport.c ae_kqueue.c ae_select.c

================================================
FILE: dep/ae/ae.c
================================================
/* A simple event-driven programming library. Originally I wrote this code
 * for the Jim's event-loop (Jim is a Tcl interpreter) but later translated
 * it in form of a library for easy reuse.
 *
 * Copyright (c) 2006-2010, Salvatore Sanfilippo <antirez at gmail dot com>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *   * Redistributions of source code must retain the above copyright notice,
 *     this list of conditions and the following disclaimer.
 *   * Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *   * Neither the name of Redis nor the names of its contributors may be used
 *     to endorse or promote products derived from this software without
 *     specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

#include <stdio.h>
#include <sys/time.h>
#include <sys/types.h>
#include <unistd.h>
#include <stdlib.h>
#include <poll.h>
#include <string.h>
#include <time.h>
#include <errno.h>

#include <dmalloc.h>

#include <ae.h>

#ifdef HAVE_CONFIG_H
# include <config.h>
#endif

/* Include the best multiplexing layer supported by this system.
 * The following should be ordered by performances, descending. */
#ifdef HAVE_EVENT_PORTS
#include "ae_evport.c"
#else
    #ifdef HAVE_EPOLL
    #include "ae_epoll.c"
    #else
        #ifdef HAVE_KQUEUE
        #include "ae_kqueue.c"
        #else
        #include "ae_select.c"
        #endif
    #endif
#endif

/* Allocate and initialize an event loop with room for setsize file
 * descriptor slots.
 *
 * Returns the new loop, or NULL when one of the allocations or the creation
 * of the polling backend state fails; nothing is leaked in that case. */
aeEventLoop *aeCreateEventLoop(int setsize) {
    aeEventLoop *loop = dalloc(sizeof(*loop));
    int fd;

    if (loop == NULL) return NULL;

    /* Both tables are requested before either result is inspected, so the
     * failure path below can release them unconditionally. */
    loop->events = dalloc(sizeof(aeFileEvent)*setsize);
    loop->fired = dalloc(sizeof(aeFiredEvent)*setsize);
    if (loop->events == NULL || loop->fired == NULL) goto fail;

    loop->setsize = setsize;
    loop->lastTime = time(NULL);
    loop->timeEventHead = NULL;
    loop->timeEventNextId = 0;
    loop->stop = 0;
    loop->maxfd = -1;
    loop->beforesleep = NULL;
    loop->bsdata = NULL;
    if (aeApiCreate(loop) == -1) goto fail;

    /* A slot whose mask is AE_NONE counts as unregistered, so every slot
     * starts out in that state. */
    for (fd = 0; fd < setsize; fd++) {
        loop->events[fd].mask = AE_NONE;
    }
    return loop;

fail:
    dfree(loop->events);
    dfree(loop->fired);
    dfree(loop);
    return NULL;
}

/* Return the current set size, i.e. the number of file descriptor slots the
 * event loop tracks. */
int aeGetSetSize(aeEventLoop *eventLoop) {
    return eventLoop->setsize;
}

/* Resize the maximum set size of the event loop.
 *
 * AE_ERR is returned, and the loop tables are left alone, when a registered
 * file descriptor would not fit in the requested size (maxfd >= setsize) or
 * when aeApiResize() reports a failure.
 *
 * AE_ERR is also returned when one of the loop tables cannot be
 * reallocated. The loop stays usable in that case: a table that was already
 * reallocated keeps its new storage, and the recorded set size becomes the
 * smaller of the old and the requested size, which every table can hold.
 *
 * Otherwise AE_OK is returned and the operation is successful. */
int aeResizeSetSize(aeEventLoop *eventLoop, int setsize) {
    aeFileEvent *events;
    aeFiredEvent *fired;
    int i;

    if (setsize == eventLoop->setsize) return AE_OK;
    if (eventLoop->maxfd >= setsize) return AE_ERR;
    if (aeApiResize(eventLoop,setsize) == -1) return AE_ERR;

    /* Reallocate through temporaries: storing a failed drealloc() result
     * straight into the loop would lose the old table and leave a NULL
     * pointer behind for the next access. A NULL result is only treated as
     * a failure for a non-empty request, since a zero-sized one may
     * legitimately yield NULL. */
    events = drealloc(eventLoop->events,sizeof(aeFileEvent)*setsize);
    if (events == NULL && setsize != 0) goto oom;
    eventLoop->events = events;

    fired = drealloc(eventLoop->fired,sizeof(aeFiredEvent)*setsize);
    if (fired == NULL && setsize != 0) goto oom;
    eventLoop->fired = fired;

    eventLoop->setsize = setsize;

    /* Make sure that if we created new slots, they are initialized with
     * an AE_NONE mask. */
    for (i = eventLoop->maxfd+1; i < setsize; i++)
        eventLoop->events[i].mask = AE_NONE;
    return AE_OK;

oom:
    /* The backend, and possibly the events table, may already have been
     * shrunk: never keep advertising more slots than the smallest table
     * holds. Registered descriptors still fit because maxfd < setsize. */
    if (setsize < eventLoop->setsize) eventLoop->setsize = setsize;
    return AE_ERR;
}

/* Tear down an event loop: release the polling backend state, the file
 * event tables, every time event still linked in the loop and finally the
 * loop itself.
 *
 * Time events are freed without running their finalizerProc. */
void aeDeleteEventLoop(aeEventLoop *eventLoop) {
    aeTimeEvent *te, *next;

    aeApiFree(eventLoop);
    dfree(eventLoop->events);
    dfree(eventLoop->fired);

    /* Time events are allocated by aeCreateTimeEvent() and only unlinked
     * while time events are being processed, so whatever is still on the
     * list would leak if it were not released here. */
    for (te = eventLoop->timeEventHead; te != NULL; te = next) {
        next = te->next;
        dfree(te);
    }
    dfree(eventLoop);
}

/* Raise the stop flag of the loop. aeMain() tests this flag before each
 * iteration and returns once it is set. */
void aeStop(aeEventLoop *eventLoop) {
    eventLoop->stop = 1;
}

/* Register proc as the handler of the events in mask (AE_READABLE and/or
 * AE_WRITABLE) for fd; clientData is handed to the handler when it runs.
 * Events already registered for fd are kept.
 *
 * When fd does not fit in the current set, the set is first resized to
 * fd+1000 slots. Returns AE_OK on success, AE_ERR when that resize or the
 * registration with the polling backend fails. */
int aeCreateFileEvent(aeEventLoop *eventLoop, int fd, int mask,
        aeFileProc *proc, void *clientData)
{
    aeFileEvent *slot;

    if (fd >= eventLoop->setsize &&
        aeResizeSetSize(eventLoop,fd+1000) != AE_OK)
    {
        return AE_ERR;
    }

    /* Take the slot address only now: resizing reallocates the table. */
    slot = &eventLoop->events[fd];

    if (aeApiAddEvent(eventLoop, fd, mask) == -1) return AE_ERR;

    slot->mask |= mask;
    if (mask & AE_READABLE) slot->rfileProc = proc;
    if (mask & AE_WRITABLE) slot->wfileProc = proc;
    slot->clientData = clientData;
    if (eventLoop->maxfd < fd) eventLoop->maxfd = fd;
    return AE_OK;
}

/* Stop watching fd for the events in mask. Nothing happens when fd lies
 * beyond the current set or has no registered event. When the highest
 * registered descriptor loses its last event, maxfd drops to the next lower
 * descriptor that still has one, or to -1 when there is none. */
void aeDeleteFileEvent(aeEventLoop *eventLoop, int fd, int mask)
{
    aeFileEvent *slot;
    int top;

    if (fd >= eventLoop->setsize) return;
    slot = &eventLoop->events[fd];
    if (slot->mask == AE_NONE) return;

    /* The backend is told before the slot is updated, so it still sees the
     * mask that was registered so far. */
    aeApiDelEvent(eventLoop, fd, mask);
    slot->mask &= ~mask;

    if (fd != eventLoop->maxfd || slot->mask != AE_NONE) return;

    /* Update the max fd */
    top = eventLoop->maxfd - 1;
    while (top >= 0 && eventLoop->events[top].mask == AE_NONE) top--;
    eventLoop->maxfd = top;
}

/* Return the event mask currently registered for fd, or 0 when fd lies
 * beyond the current set size. */
int aeGetFileEvents(aeEventLoop *eventLoop, int fd) {
    return (fd >= eventLoop->setsize) ? 0 : eventLoop->events[fd].mask;
}

/* Read the clock with gettimeofday() and store the whole seconds in
 * *seconds and the millisecond part of the current second in
 * *milliseconds. */
static void aeGetTime(long *seconds, long *milliseconds)
{
    struct timeval now;
    long usec_to_ms = 1000;

    gettimeofday(&now, NULL);
    *seconds = now.tv_sec;
    *milliseconds = now.tv_usec / usec_to_ms;
}

/* Compute the point in time that lies the given number of milliseconds
 * after now and store it as seconds (*sec) plus milliseconds (*ms). One
 * second is carried over when the millisecond sum reaches 1000. */
static void aeAddMillisecondsToNow(long long milliseconds, long *sec, long *ms) {
    long now_sec, now_ms;
    long due_sec, due_ms;

    aeGetTime(&now_sec, &now_ms);

    due_sec = now_sec + milliseconds/1000;
    due_ms = now_ms + milliseconds%1000;
    if (due_ms >= 1000) {
        due_ms -= 1000;
        due_sec++;
    }

    *sec = due_sec;
    *ms = due_ms;
}

/* Schedule proc to be called once the given number of milliseconds has
 * elapsed, with clientData as its argument. finalizerProc, when not NULL,
 * is called with clientData when the event is removed while time events
 * are processed.
 *
 * Returns the id of the new time event, or AE_ERR when the event cannot be
 * allocated (the id counter has been advanced in that case as well). */
long long aeCreateTimeEvent(aeEventLoop *eventLoop, long long milliseconds,
        aeTimeProc *proc, void *clientData,
        aeEventFinalizerProc *finalizerProc)
{
    long long id = eventLoop->timeEventNextId++;
    aeTimeEvent *ev = dalloc(sizeof(*ev));

    if (ev == NULL) return AE_ERR;

    ev->id = id;
    aeAddMillisecondsToNow(milliseconds,&ev->when_sec,&ev->when_ms);
    ev->timeProc = proc;
    ev->finalizerProc = finalizerProc;
    ev->clientData = clientData;

    /* New events go to the head of the list. */
    ev->next = eventLoop->timeEventHead;
    eventLoop->timeEventHead = ev;
    return id;
}

/* Flag the first time event carrying the given id as deleted. The event is
 * not released here; it is unlinked and freed when time events are next
 * processed. Returns AE_OK when the id was found, AE_ERR otherwise. */
int aeDeleteTimeEvent(aeEventLoop *eventLoop, long long id)
{
    aeTimeEvent *ev;

    for (ev = eventLoop->timeEventHead; ev != NULL; ev = ev->next) {
        if (ev->id != id) continue;
        ev->id = AE_DELETED_EVENT_ID;
        return AE_OK;
    }
    return AE_ERR; /* NO event with the specified ID found */
}

/* Find the time event that is due first, so the caller knows how long the
 * poll may sleep without delaying any timer. Returns NULL when there are
 * no time events. Among events due at the same instant, the one closest to
 * the head of the list is returned.
 *
 * The list is unsorted, so this is a full O(N) scan.
 * Possible optimizations (not needed by Redis so far, but...):
 * 1) Insert the event in order, so that the nearest is just the head.
 *    Much better but still insertion or deletion of timers is O(N).
 * 2) Use a skiplist to have this operation as O(1) and insertion as O(log(N)).
 */
static aeTimeEvent *aeSearchNearestTimer(aeEventLoop *eventLoop)
{
    aeTimeEvent *best = NULL;
    aeTimeEvent *cur;

    for (cur = eventLoop->timeEventHead; cur != NULL; cur = cur->next) {
        if (best == NULL || cur->when_sec < best->when_sec) {
            best = cur;
            continue;
        }
        if (cur->when_sec == best->when_sec && cur->when_ms < best->when_ms)
            best = cur;
    }
    return best;
}

/* Process time events.
 *
 * Walks the time event list once. Events flagged with AE_DELETED_EVENT_ID
 * are unlinked, passed to their finalizerProc (if any) and freed. Events
 * whose due time has been reached have their timeProc called and are then
 * either rescheduled by the number of milliseconds the handler returned, or
 * flagged for deletion when it returned AE_NOMORE.
 *
 * Returns the number of handlers that were called. */
static int processTimeEvents(aeEventLoop *eventLoop) {
    int processed = 0;
    aeTimeEvent *te, *prev;
    long long maxId;
    time_t now = time(NULL);

    /* If the system clock is moved to the future, and then set back to the
     * right value, time events may be delayed in a random way. Often this
     * means that scheduled operations will not be performed soon enough.
     *
     * Here we try to detect system clock skews, and force all the time
     * events to be processed ASAP when this happens: the idea is that
     * processing events earlier is less dangerous than delaying them
     * indefinitely, and practice suggests it is. */
    if (now < eventLoop->lastTime) {
        te = eventLoop->timeEventHead;
        while(te) {
            te->when_sec = 0;
            te = te->next;
        }
    }
    eventLoop->lastTime = now;

    /* prev trails te so that a deleted node can be unlinked in place. */
    prev = NULL;
    te = eventLoop->timeEventHead;
    /* Highest id handed out before this pass started. */
    maxId = eventLoop->timeEventNextId-1;
    while(te) {
        long now_sec, now_ms;
        long long id;

        /* Remove events scheduled for deletion. */
        if (te->id == AE_DELETED_EVENT_ID) {
            aeTimeEvent *next = te->next;
            if (prev == NULL)
                eventLoop->timeEventHead = te->next;
            else
                prev->next = te->next;
            if (te->finalizerProc)
                te->finalizerProc(eventLoop, te->clientData);
            dfree(te);
            /* prev is left untouched: it still precedes the new te. */
            te = next;
            continue;
        }

        /* Make sure we don't process time events created by time events in
         * this iteration. Note that this check is currently useless: we always
         * add new timers on the head, however if we change the implementation
         * detail, this check may be useful again: we keep it here for future
         * defense. */
        if (te->id > maxId) {
            te = te->next;
            continue;
        }
        /* The clock is read again for every event, so time spent in earlier
         * handlers is taken into account. */
        aeGetTime(&now_sec, &now_ms);
        if (now_sec > te->when_sec ||
            (now_sec == te->when_sec && now_ms >= te->when_ms))
        {
            int retval;

            id = te->id;
            retval = te->timeProc(eventLoop, id, te->clientData);
            processed++;
            if (retval != AE_NOMORE) {
                /* The handler asked to fire again retval milliseconds
                 * from now. */
                aeAddMillisecondsToNow(retval,&te->when_sec,&te->when_ms);
            } else {
                /* Only flag the event; it is unlinked and freed by a later
                 * pass through this function. */
                te->id = AE_DELETED_EVENT_ID;
            }
        }
        prev = te;
        te = te->next;
    }
    return processed;
}

/* Process every pending file event, then every pending time event.
 * Without special flags the function sleeps until some file event
 * fires, or when the next time event occurs (if any).
 *
 * If flags is 0, the function does nothing and returns.
 * if flags has AE_ALL_EVENTS set, all the kind of events are processed.
 * if flags has AE_FILE_EVENTS set, file events are processed.
 * if flags has AE_TIME_EVENTS set, time events are processed.
 * if flags has AE_DONT_WAIT set the function returns ASAP until all
 * the events that's possible to process without to wait are processed.
 *
 * The function returns the number of events processed. */
int aeProcessEvents(aeEventLoop *eventLoop, int flags)
{
    int processed = 0, numevents;

    /* Nothing to do? return ASAP */
    if (!(flags & AE_TIME_EVENTS) && !(flags & AE_FILE_EVENTS)) return 0;

    /* Note that we want call select() even if there are no
     * file events to process as long as we want to process time
     * events, in order to sleep until the next time event is ready
     * to fire. */
    if (eventLoop->maxfd != -1 ||
        ((flags & AE_TIME_EVENTS) && !(flags & AE_DONT_WAIT))) {
        int j;
        aeTimeEvent *shortest = NULL;
        struct timeval tv, *tvp;

        if (flags & AE_TIME_EVENTS && !(flags & AE_DONT_WAIT))
            shortest = aeSearchNearestTimer(eventLoop);
        if (shortest) {
            long now_sec, now_ms;

            aeGetTime(&now_sec, &now_ms);
            tvp = &tv;

            /* How many milliseconds we need to wait for the next
             * time event to fire? */
            long long ms =
                (shortest->when_sec - now_sec)*1000 +
                shortest->when_ms - now_ms;

            if (ms > 0) {
                tvp->tv_sec = ms/1000;
                tvp->tv_usec = (ms % 1000)*1000;
            } else {
                /* The timer is already due: poll without sleeping. */
                tvp->tv_sec = 0;
                tvp->tv_usec = 0;
            }
        } else {
            /* If we have to check for events but need to return
             * ASAP because of AE_DONT_WAIT we need to set the timeout
             * to zero */
            if (flags & AE_DONT_WAIT) {
                tv.tv_sec = tv.tv_usec = 0;
                tvp = &tv;
            } else {
                /* Otherwise we can block */
                tvp = NULL; /* wait forever */
            }
        }

        numevents = aeApiPoll(eventLoop, tvp);
        for (j = 0; j < numevents; j++) {
            int fd = eventLoop->fired[j].fd;
            int mask = eventLoop->fired[j].mask;
            aeFileEvent *fe = &eventLoop->events[fd];
            int rfired = 0;

            /* note the fe->mask & mask & ... code: maybe an already processed
             * event removed an element that fired and we still didn't
             * processed, so we check if the event is still valid. */
            if (fe->mask & mask & AE_READABLE) {
                rfired = 1;
                fe->rfileProc(eventLoop,fd,fe->clientData,mask);
                /* The handler may have registered a descriptor beyond the
                 * current set size, which makes aeCreateFileEvent()
                 * reallocate the events table. Look the slot up again
                 * instead of going on with a possibly stale pointer. */
                fe = &eventLoop->events[fd];
            }
            if (fe->mask & mask & AE_WRITABLE) {
                /* Do not call the same handler twice for one descriptor
                 * when it was registered for both events. */
                if (!rfired || fe->wfileProc != fe->rfileProc)
                    fe->wfileProc(eventLoop,fd,fe->clientData,mask);
            }
            processed++;
        }
    }
    /* Check time events */
    if (flags & AE_TIME_EVENTS)
        processed += processTimeEvents(eventLoop);

    return processed; /* return the number of processed file/time events */
}

/* Block in poll() for at most the given number of milliseconds until fd
 * becomes readable and/or writable, as selected by mask.
 *
 * When poll() reports the descriptor, the return value is a mask built from
 * AE_READABLE and AE_WRITABLE; error and hang-up conditions are reported as
 * AE_WRITABLE. Otherwise the value returned by poll() is passed through
 * unchanged. */
int aeWait(int fd, int mask, long long milliseconds) {
    struct pollfd pfd;
    int ready;
    int result = 0;

    memset(&pfd, 0, sizeof(pfd));
    pfd.fd = fd;
    if (mask & AE_READABLE) pfd.events |= POLLIN;
    if (mask & AE_WRITABLE) pfd.events |= POLLOUT;

    ready = poll(&pfd, 1, milliseconds);
    if (ready != 1) return ready;

    if (pfd.revents & POLLIN) result |= AE_READABLE;
    if (pfd.revents & (POLLOUT|POLLERR|POLLHUP)) result |= AE_WRITABLE;
    return result;
}

/* Run the event loop until the stop flag is raised. The flag is cleared on
 * entry; each iteration first calls the beforesleep hook, when one is
 * installed, and then processes file and time events. */
void aeMain(aeEventLoop *eventLoop) {
    for (eventLoop->stop = 0; !eventLoop->stop; ) {
        aeBeforeSleepProc *hook = eventLoop->beforesleep;

        if (hook != NULL) {
            hook(eventLoop, eventLoop->bsdata);
        }
        aeProcessEvents(eventLoop, AE_ALL_EVENTS);
    }
}

/* Return the name reported by the polling backend that was compiled into
 * this file, i.e. the result of aeApiName(). */
char *aeGetApiName(void) {
    return aeApiName();
}

/* Install the hook that aeMain() calls before each round of event
 * processing, together with the private_data pointer that is handed back
 * to it. Passing a NULL beforesleep removes the hook. */
void aeSetBeforeSleepProc(aeEventLoop *eventLoop, aeBeforeSleepProc *beforesleep, void *private_data) {
    eventLoop->bsdata = private_data;
    eventLoop->beforesleep = beforesleep;
}


================================================
FILE: dep/ae/ae.h
================================================
/* A simple event-driven programming library. Originally I wrote this code
 * for the Jim's event-loop (Jim is a Tcl interpreter) but later translated
 * it in form of a library for easy reuse.
 *
 * Copyright (c) 2006-2012, Salvatore Sanfilippo <antirez at gmail dot com>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *   * Redistributions of source code must retain the above copyright notice,
 *     this list of conditions and the following disclaimer.
 *   * Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *   * Neither the name of Redis nor the names of its contributors may be used
 *     to endorse or promote products derived from this software without
 *     specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

#ifndef __AE_H__
#define __AE_H__

#include <time.h>

/* Status codes returned by the ae functions. */
#define AE_OK 0
#define AE_ERR -1

/* File event mask bits; AE_NONE means that no event is registered. */
#define AE_NONE 0
#define AE_READABLE 1
#define AE_WRITABLE 2

/* Flags accepted by aeProcessEvents(). */
#define AE_FILE_EVENTS 1
#define AE_TIME_EVENTS 2
#define AE_ALL_EVENTS (AE_FILE_EVENTS|AE_TIME_EVENTS)
#define AE_DONT_WAIT 4

/* AE_NOMORE is what a time event handler returns to have its event deleted
 * instead of rescheduled. AE_DELETED_EVENT_ID is the id stored in a time
 * event that is waiting to be unlinked and freed. */
#define AE_NOMORE -1
#define AE_DELETED_EVENT_ID -1

/* Macros */
/* Evaluate V and discard the result. */
#define AE_NOTUSED(V) ((void) V)

/* Forward declaration so the callback types below can refer to the loop. */
struct aeEventLoop;

/* Types and data structures */
/* File event handler: receives the descriptor, the clientData registered
 * with it and the mask of events that fired. */
typedef void aeFileProc(struct aeEventLoop *eventLoop, int fd, void *clientData, int mask);
/* Time event handler: returns AE_NOMORE to have the event deleted, any other
 * value is the number of milliseconds after which it is called again. */
typedef int aeTimeProc(struct aeEventLoop *eventLoop, long long id, void *clientData);
/* Called with the clientData of a time event right before it is freed. */
typedef void aeEventFinalizerProc(struct aeEventLoop *eventLoop, void *clientData);
/* Hook called by aeMain() before each round of event processing. */
typedef void aeBeforeSleepProc(struct aeEventLoop *eventLoop, void *private_data);

/* File event structure: one slot per file descriptor, indexed by the
 * descriptor number in aeEventLoop.events. */
typedef struct aeFileEvent {
    int mask; /* bitwise OR of AE_READABLE / AE_WRITABLE, or AE_NONE */
    aeFileProc *rfileProc;  /* handler called for AE_READABLE */
    aeFileProc *wfileProc;  /* handler called for AE_WRITABLE */
    void *clientData;       /* passed to both handlers */
} aeFileEvent;

/* Time event structure: a node of the singly linked list that starts at
 * aeEventLoop.timeEventHead. */
typedef struct aeTimeEvent {
    long long id; /* time event identifier, or AE_DELETED_EVENT_ID. */
    long when_sec; /* due time: seconds */
    long when_ms; /* due time: milliseconds */
    aeTimeProc *timeProc;                /* handler called when due */
    aeEventFinalizerProc *finalizerProc; /* optional, called before freeing */
    void *clientData;                    /* passed to both callbacks */
    struct aeTimeEvent *next;            /* next node, NULL at the tail */
} aeTimeEvent;

/* A fired event: filled in by the polling backend and consumed by
 * aeProcessEvents(). */
typedef struct aeFiredEvent {
    int fd;   /* descriptor the event was reported for */
    int mask; /* AE_READABLE / AE_WRITABLE bits that fired */
} aeFiredEvent;

/* State of an event based program */
typedef struct aeEventLoop {
    int maxfd;   /* highest file descriptor currently registered, -1 if none */
    int setsize; /* max number of file descriptors tracked */
    long long timeEventNextId; /* id given to the next time event created */
    time_t lastTime;     /* Used to detect system clock skew */
    aeFileEvent *events; /* Registered events */
    aeFiredEvent *fired; /* Fired events */
    aeTimeEvent *timeEventHead; /* head of the time event list */
    int stop;            /* non-zero makes aeMain() return */
    void *apidata; /* This is used for polling API specific data */
    aeBeforeSleepProc *beforesleep; /* hook run by aeMain(), may be NULL */
    void *bsdata; /* This is used for beforesleep private data */
} aeEventLoop;

/* Prototypes */

/* Loop life cycle. */
aeEventLoop *aeCreateEventLoop(int setsize);
void aeDeleteEventLoop(aeEventLoop *eventLoop);
void aeStop(aeEventLoop *eventLoop);
/* File events. */
int aeCreateFileEvent(aeEventLoop *eventLoop, int fd, int mask,
        aeFileProc *proc, void *clientData);
void aeDeleteFileEvent(aeEventLoop *eventLoop, int fd, int mask);
int aeGetFileEvents(aeEventLoop *eventLoop, int fd);
/* Time events. */
long long aeCreateTimeEvent(aeEventLoop *eventLoop, long long milliseconds,
        aeTimeProc *proc, void *clientData,
        aeEventFinalizerProc *finalizerProc);
int aeDeleteTimeEvent(aeEventLoop *eventLoop, long long id);
/* Event processing. */
int aeProcessEvents(aeEventLoop *eventLoop, int flags);
int aeWait(int fd, int mask, long long milliseconds);
void aeMain(aeEventLoop *eventLoop);
/* Introspection and configuration. */
char *aeGetApiName(void);
void aeSetBeforeSleepProc(aeEventLoop *eventLoop, aeBeforeSleepProc *beforesleep, void *private_data);
int aeGetSetSize(aeEventLoop *eventLoop);
int aeResizeSetSize(aeEventLoop *eventLoop, int setsize);

#endif


================================================
FILE: dep/ae/ae_epoll.c
================================================
/* Linux epoll(2) based ae.c module
 *
 * Copyright (c) 2009-2012, Salvatore Sanfilippo <antirez at gmail dot com>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *   * Redistributions of source code must retain the above copyright notice,
 *     this list of conditions and the following disclaimer.
 *   * Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *   * Neither the name of Redis nor the names of its contributors may be used
 *     to endorse or promote products derived from this software without
 *     specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */


#include <sys/epoll.h>

/* State of the epoll backend, stored in aeEventLoop.apidata. */
typedef struct aeApiState {
    int epfd;                   /* descriptor returned by epoll_create() */
    struct epoll_event *events; /* buffer filled by epoll_wait() */
} aeApiState;

/* Create the epoll backend state for the loop: an event buffer with one
 * entry per slot of the set and an epoll instance. The state is stored in
 * eventLoop->apidata.
 *
 * Returns 0 on success, -1 on failure after releasing whatever had been
 * allocated. */
static int aeApiCreate(aeEventLoop *eventLoop) {
    aeApiState *state = dalloc(sizeof(aeApiState));

    if (state == NULL) return -1;

    state->events = dalloc(sizeof(struct epoll_event)*eventLoop->setsize);
    if (state->events == NULL) goto fail_state;

    state->epfd = epoll_create(1024); /* 1024 is just a hint for the kernel */
    if (state->epfd == -1) goto fail_events;

    eventLoop->apidata = state;
    return 0;

fail_events:
    dfree(state->events);
fail_state:
    dfree(state);
    return -1;
}

/* Resize the epoll_wait() buffer to setsize entries.
 *
 * Returns 0 on success. Returns -1 when the buffer cannot be reallocated;
 * the previous buffer is kept in that case so the backend stays usable. */
static int aeApiResize(aeEventLoop *eventLoop, int setsize) {
    aeApiState *state = eventLoop->apidata;
    struct epoll_event *events;

    /* Go through a temporary so that a failed reallocation does not
     * overwrite the only pointer to the current buffer. A NULL result for a
     * zero-sized request is not treated as a failure. */
    events = drealloc(state->events, sizeof(struct epoll_event)*setsize);
    if (events == NULL && setsize > 0) return -1;
    state->events = events;
    return 0;
}

/* Release the epoll backend state of the loop: close the epoll descriptor,
 * then free the event buffer and the state itself. */
static void aeApiFree(aeEventLoop *eventLoop) {
    aeApiState *st = eventLoop->apidata;
    struct epoll_event *buffer = st->events;

    close(st->epfd);
    dfree(buffer);
    dfree(st);
}

/* Make epoll watch fd for the events in mask in addition to the ones that
 * are already registered in the loop for that descriptor.
 * Returns 0 on success, -1 when epoll_ctl() fails. */
static int aeApiAddEvent(aeEventLoop *eventLoop, int fd, int mask) {
    aeApiState *state = eventLoop->apidata;
    int registered = eventLoop->events[fd].mask;
    int wanted = mask | registered; /* Merge old events */
    /* If the fd was already monitored for some event, we need a MOD
     * operation. Otherwise we need an ADD operation. */
    int op = (registered == AE_NONE) ? EPOLL_CTL_ADD : EPOLL_CTL_MOD;
    struct epoll_event ee = {0}; /* avoid valgrind warning */

    if (wanted & AE_READABLE) ee.events |= EPOLLIN;
    if (wanted & AE_WRITABLE) ee.events |= EPOLLOUT;
    ee.data.fd = fd;

    return (epoll_ctl(state->epfd,op,fd,&ee) == -1) ? -1 : 0;
}

/* Stop watching fd for the events in delmask. The events that remain are
 * computed from the mask still stored in the loop for that descriptor: when
 * some remain the registration is modified, otherwise it is removed. The
 * result of epoll_ctl() is not checked. */
static void aeApiDelEvent(aeEventLoop *eventLoop, int fd, int delmask) {
    aeApiState *state = eventLoop->apidata;
    int remaining = eventLoop->events[fd].mask & (~delmask);
    struct epoll_event ee = {0}; /* avoid valgrind warning */
    int op;

    if (remaining & AE_READABLE) ee.events |= EPOLLIN;
    if (remaining & AE_WRITABLE) ee.events |= EPOLLOUT;
    ee.data.fd = fd;

    /* Note, Kernel < 2.6.9 requires a non null event pointer even for
     * EPOLL_CTL_DEL, so the event is passed in both cases. */
    op = (remaining != AE_NONE) ? EPOLL_CTL_MOD : EPOLL_CTL_DEL;
    epoll_ctl(state->epfd,op,fd,&ee);
}

/* Wait for events with epoll_wait() and copy them into eventLoop->fired.
 *
 * tvp is the longest time to wait, converted to milliseconds; NULL means
 * wait without a timeout. Error and hang-up conditions are reported as
 * AE_WRITABLE. Returns the number of entries written to eventLoop->fired,
 * which is 0 when epoll_wait() returns zero or a negative value. */
static int aeApiPoll(aeEventLoop *eventLoop, struct timeval *tvp) {
    aeApiState *state = eventLoop->apidata;
    int timeout_ms = -1;
    int nready, j;

    if (tvp != NULL) timeout_ms = tvp->tv_sec*1000 + tvp->tv_usec/1000;

    nready = epoll_wait(state->epfd,state->events,eventLoop->setsize,
            timeout_ms);
    if (nready <= 0) return 0;

    for (j = 0; j < nready; j++) {
        const struct epoll_event *e = &state->events[j];
        int mask = 0;

        if (e->events & EPOLLIN) mask |= AE_READABLE;
        if (e->events & (EPOLLOUT|EPOLLERR|EPOLLHUP)) mask |= AE_WRITABLE;
        eventLoop->fired[j].fd = e->data.fd;
        eventLoop->fired[j].mask = mask;
    }
    return nready;
}

/* Name of this polling backend. */
static char *aeApiName(void) {
    char *name = "epoll";

    return name;
}


================================================
FILE: dep/ae/ae_evport.c
================================================
/* ae.c module for illumos event ports.
 *
 * Copyright (c) 2012, Joyent, Inc. All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *   * Redistributions of source code must retain the above copyright notice,
 *     this list of conditions and the following disclaimer.
 *   * Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *   * Neither the name of Redis nor the names of its contributors may be used
 *     to endorse or promote products derived from this software without
 *     specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */


#include <assert.h>
#include <errno.h>
#include <port.h>
#include <poll.h>

#include <sys/types.h>
#include <sys/time.h>

#include <stdio.h>

/* When non-zero, the functions in this file trace their activity on stderr. */
static int evport_debug = 0;

/*
 * This file implements the ae API using event ports, present on Solaris-based
 * systems since Solaris 10.  Using the event port interface, we associate file
 * descriptors with the port.  Each association also includes the set of poll(2)
 * events that the consumer is interested in (e.g., POLLIN and POLLOUT).
 *
 * There's one tricky piece to this implementation: when we return events via
 * aeApiPoll, the corresponding file descriptors become dissociated from the
 * port.  This is necessary because poll events are level-triggered, so if the
 * fd didn't become dissociated, it would immediately fire another event since
 * the underlying state hasn't changed yet.  We must re-associate the file
 * descriptor, but only after we know that our caller has actually read from it.
 * The ae API does not tell us exactly when that happens, but we do know that
 * it must happen by the time aeApiPoll is called again.  Our solution is to
 * keep track of the last fds returned by aeApiPoll and re-associate them next
 * time aeApiPoll is invoked.
 *
 * To summarize, in this module, each fd association is EITHER (a) represented
 * only via the in-kernel association OR (b) represented by pending_fds and
 * pending_masks.  (b) is only true for the last fds we returned from aeApiPoll,
 * and only until we enter aeApiPoll again (at which point we restore the
 * in-kernel association).
 */
/* Capacity of the pending_fds/pending_masks arrays and of the event buffer
 * handed to port_getn() in aeApiPoll. */
#define MAX_EVENT_BATCHSZ 512

/* Per-event-loop state of the event port backend, stored in
 * eventLoop->apidata.  Only the first npending slots of the two arrays are
 * meaningful; a slot whose fd is -1 has been deleted since it was returned. */
typedef struct aeApiState {
    int     portfd;                             /* event port */
    int     npending;                           /* # of pending fds */
    int     pending_fds[MAX_EVENT_BATCHSZ];     /* pending fds */
    int     pending_masks[MAX_EVENT_BATCHSZ];   /* pending fds' masks */
} aeApiState;

/*
 * Allocate the backend state, create the event port and mark every pending
 * slot as unused.  Returns 0 on success, or -1 if either the allocation or
 * port_create() fails.
 */
static int aeApiCreate(aeEventLoop *eventLoop) {
    aeApiState *st;
    int slot;

    st = dalloc(sizeof(aeApiState));
    if (st == NULL)
        return -1;

    st->portfd = port_create();
    if (st->portfd == -1) {
        dfree(st);
        return -1;
    }

    /* Nothing has been handed out by aeApiPoll yet. */
    st->npending = 0;
    for (slot = 0; slot < MAX_EVENT_BATCHSZ; slot++) {
        st->pending_masks[slot] = AE_NONE;
        st->pending_fds[slot] = -1;
    }

    eventLoop->apidata = st;
    return 0;
}

/* This backend keeps no table sized by setsize, so a resize request always
 * succeeds without doing anything. */
static int aeApiResize(aeEventLoop *eventLoop, int setsize) {
    (void)eventLoop;
    (void)setsize;
    return 0;
}

/* Close the event port and release the backend state. */
static void aeApiFree(aeEventLoop *eventLoop) {
    aeApiState *st;

    st = eventLoop->apidata;
    close(st->portfd);
    dfree(st);
}

/*
 * Search the first npending slots for fd.  Returns the index of the matching
 * slot, or -1 when fd is not among the pending descriptors.
 */
static int aeApiLookupPending(aeApiState *state, int fd) {
    int slot = 0;

    while (slot < state->npending) {
        if (state->pending_fds[slot] == fd)
            return slot;
        slot++;
    }

    return -1;
}

/*
 * Helper function to invoke port_associate for the given fd and mask.
 *
 * The ae mask is translated to poll(2) events (AE_READABLE -> POLLIN,
 * AE_WRITABLE -> POLLOUT) and is also passed as the association's user
 * pointer, which is how aeApiPoll later recovers it.  "where" names the
 * caller and is only used in diagnostics.
 *
 * Returns the result of port_associate(): 0 on success, -1 on failure (a
 * message is then written to stderr).
 */
static int aeApiAssociate(const char *where, int portfd, int fd, int mask) {
    int events = 0;
    int rv, err;

    if (mask & AE_READABLE)
        events |= POLLIN;
    if (mask & AE_WRITABLE)
        events |= POLLOUT;

    if (evport_debug)
        fprintf(stderr, "%s: port_associate(%d, 0x%x) = ", where, fd, events);

    rv = port_associate(portfd, PORT_SOURCE_FD, fd, events,
        (void *)(uintptr_t)mask);
    /* Save errno right away: the fprintf calls below may overwrite it. */
    err = errno;

    if (evport_debug)
        fprintf(stderr, "%d (%s)\n", rv, rv == 0 ? "no error" : strerror(err));

    if (rv == -1) {
        fprintf(stderr, "%s: port_associate: %s\n", where, strerror(err));

        /* Terminate the line so later diagnostics do not run into it. */
        if (err == EAGAIN)
            fprintf(stderr, "aeApiAssociate: event port limit exceeded.\n");
    }

    return rv;
}

/*
 * Start monitoring fd for the events in mask, in addition to whatever
 * eventLoop->events[fd].mask already records.  Returns 0 when the fd is
 * pending (only its pending mask is updated), otherwise the result of
 * aeApiAssociate().
 */
static int aeApiAddEvent(aeEventLoop *eventLoop, int fd, int mask) {
    aeApiState *st = eventLoop->apidata;
    int wanted, slot;

    if (evport_debug)
        fprintf(stderr, "aeApiAddEvent: fd %d mask 0x%x\n", fd, mask);

    /*
     * port_associate() replaces the event set of an existing association, so
     * the new association has to carry the already registered events as well
     * as the requested ones.
     */
    wanted = mask | eventLoop->events[fd].mask;

    slot = aeApiLookupPending(st, fd);
    if (slot == -1)
        return aeApiAssociate("aeApiAddEvent", st->portfd, fd, wanted);

    /*
     * The fd was returned by the last aeApiPoll and is not associated with
     * the port right now.  Only record the wider mask; the next aeApiPoll
     * call re-associates the fd with it.
     */
    if (evport_debug)
        fprintf(stderr, "aeApiAddEvent: adding to pending fd %d\n", fd);
    st->pending_masks[slot] |= wanted;
    return 0;
}

/*
 * Stop monitoring fd for the events in mask.  The caller is expected to have
 * already removed those events from eventLoop->events[fd].mask.  Failures of
 * the underlying port calls are treated as fatal (abort()).
 */
static void aeApiDelEvent(aeEventLoop *eventLoop, int fd, int mask) {
    aeApiState *st = eventLoop->apidata;
    int remaining, slot;

    if (evport_debug)
        fprintf(stderr, "del fd %d mask 0x%x\n", fd, mask);

    slot = aeApiLookupPending(st, fd);
    if (slot != -1) {
        if (evport_debug)
            fprintf(stderr, "deleting event from pending fd %d\n", fd);

        /*
         * The fd was just returned by aeApiPoll and therefore has no
         * in-kernel association; trimming the pending mask is enough.  A
         * slot left without events is marked deleted.
         */
        st->pending_masks[slot] &= ~mask;
        if (st->pending_masks[slot] == AE_NONE)
            st->pending_fds[slot] = -1;
        return;
    }

    /*
     * The fd is associated with the port.  The events that must stay
     * registered are read from the eventLoop state, relying on the caller
     * having updated it before calling us.
     */
    remaining = eventLoop->events[fd].mask;
    if (remaining != AE_NONE) {
        /*
         * ENOMEM is potentially transient but only reported when things are
         * really bad, EAGAIN means a resource limit was reached (retrying
         * does not help), and anything else is a bug: abort in every case.
         */
        if (aeApiAssociate("aeApiDelEvent", st->portfd, fd, remaining) != 0)
            abort(); /* will not return */
        return;
    }

    /* No events are left: drop the association.  Failure indicates a bug. */
    if (evport_debug)
        fprintf(stderr, "aeApiDelEvent: port_dissociate(%d)\n", fd);

    if (port_dissociate(st->portfd, PORT_SOURCE_FD, fd) != 0) {
        perror("aeApiDelEvent: port_dissociate");
        abort(); /* will not return */
    }
}

/*
 * Wait for events on the port for at most *tvp (forever when tvp is NULL)
 * and copy them into eventLoop->fired.  Returns the number of fired entries;
 * 0 on timeout or interruption.  Unexpected errors abort the process.
 */
static int aeApiPoll(aeEventLoop *eventLoop, struct timeval *tvp) {
    aeApiState *st = eventLoop->apidata;
    struct timespec ts, *tsp = NULL;
    port_event_t evbuf[MAX_EVENT_BATCHSZ];
    uint_t nevents;
    int slot, fired_mask;

    /*
     * The fds returned by the previous call were dissociated from the port
     * when they fired.  Re-associate the ones that are still wanted before
     * asking the port for new events.
     */
    for (slot = 0; slot < st->npending; slot++) {
        /* A slot holding -1 was deleted in the meantime. */
        if (st->pending_fds[slot] == -1)
            continue;

        /* See aeApiDelEvent for why this case is fatal. */
        if (aeApiAssociate("aeApiPoll", st->portfd,
            st->pending_fds[slot], st->pending_masks[slot]) != 0)
            abort();

        st->pending_masks[slot] = AE_NONE;
        st->pending_fds[slot] = -1;
    }
    st->npending = 0;

    if (tvp != NULL) {
        ts.tv_sec = tvp->tv_sec;
        ts.tv_nsec = tvp->tv_usec * 1000;
        tsp = &ts;
    }

    /*
     * port_getn can fail with ETIME and still have returned events, so an
     * ETIME failure only counts as "nothing happened" when nevents is 0.
     */
    nevents = 1;
    if (port_getn(st->portfd, evbuf, MAX_EVENT_BATCHSZ, &nevents, tsp) == -1
        && (errno != ETIME || nevents == 0)) {
        if (errno == ETIME || errno == EINTR)
            return 0;

        /* Any other error indicates a bug. */
        perror("aeApiPoll: port_get");
        abort();
    }

    st->npending = nevents;

    for (slot = 0; slot < nevents; slot++) {
        port_event_t *ev = &evbuf[slot];

        fired_mask = 0;
        if (ev->portev_events & POLLIN)
            fired_mask |= AE_READABLE;
        if (ev->portev_events & POLLOUT)
            fired_mask |= AE_WRITABLE;

        eventLoop->fired[slot].fd = ev->portev_object;
        eventLoop->fired[slot].mask = fired_mask;

        if (evport_debug)
            fprintf(stderr, "aeApiPoll: fd %d mask 0x%x\n",
                (int)ev->portev_object, fired_mask);

        /* Remember the fd and the mask it was registered with (carried in
         * the user pointer) so the next call can re-associate it. */
        st->pending_fds[slot] = ev->portev_object;
        st->pending_masks[slot] = (uintptr_t)ev->portev_user;
    }

    return nevents;
}

/* Name of the polling backend implemented by this module. */
static char *
aeApiName(void)
{
    return "evport";
}


================================================
FILE: dep/ae/ae_kqueue.c
================================================
/* Kqueue(2)-based ae.c module
 *
 * Copyright (C) 2009 Harish Mallipeddi - harish.mallipeddi@gmail.com
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *   * Redistributions of source code must retain the above copyright notice,
 *     this list of conditions and the following disclaimer.
 *   * Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *   * Neither the name of Redis nor the names of its contributors may be used
 *     to endorse or promote products derived from this software without
 *     specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */


#include <sys/types.h>
#include <sys/event.h>
#include <sys/time.h>

/* Per-event-loop state of the kqueue backend, stored in eventLoop->apidata. */
typedef struct aeApiState {
    int kqfd;               /* descriptor returned by kqueue() */
    struct kevent *events;  /* buffer that kevent() fills in aeApiPoll;
                             * allocated with eventLoop->setsize entries */
} aeApiState;

/*
 * Allocate the backend state and its event buffer (eventLoop->setsize
 * entries), then create the kqueue.  Returns 0 on success; on any failure
 * everything allocated so far is released and -1 is returned.
 */
static int aeApiCreate(aeEventLoop *eventLoop) {
    aeApiState *st = dalloc(sizeof(aeApiState));

    if (st == NULL)
        return -1;

    st->events = dalloc(sizeof(struct kevent)*eventLoop->setsize);
    if (st->events == NULL)
        goto fail_state;

    st->kqfd = kqueue();
    if (st->kqfd == -1)
        goto fail_events;

    eventLoop->apidata = st;
    return 0;

fail_events:
    dfree(st->events);
fail_state:
    dfree(st);
    return -1;
}

/*
 * Resize the buffer that receives events from kevent() to hold setsize
 * entries.
 *
 * Returns 0 on success.  If the reallocation fails, the existing buffer is
 * left in place and -1 is returned, so the backend stays usable at its old
 * size instead of losing the buffer.
 */
static int aeApiResize(aeEventLoop *eventLoop, int setsize) {
    aeApiState *state = eventLoop->apidata;
    struct kevent *resized;

    resized = drealloc(state->events, sizeof(struct kevent)*setsize);
    /* A NULL result for a zero-sized request is not a failure. */
    if (resized == NULL && setsize > 0) return -1;

    state->events = resized;
    return 0;
}

/* Close the kqueue descriptor, then release the event buffer and the state. */
static void aeApiFree(aeEventLoop *eventLoop) {
    aeApiState *st;

    st = eventLoop->apidata;
    close(st->kqfd);

    dfree(st->events);
    dfree(st);
}

/*
 * Register fd with the kqueue for the events in mask: one EVFILT_READ filter
 * for AE_READABLE and one EVFILT_WRITE filter for AE_WRITABLE.  Returns 0 on
 * success, or -1 as soon as a kevent() call fails.
 */
static int aeApiAddEvent(aeEventLoop *eventLoop, int fd, int mask) {
    aeApiState *st = eventLoop->apidata;
    struct kevent change;
    int want_read = mask & AE_READABLE;
    int want_write = mask & AE_WRITABLE;

    if (want_read) {
        EV_SET(&change, fd, EVFILT_READ, EV_ADD, 0, 0, NULL);
        if (kevent(st->kqfd, &change, 1, NULL, 0, NULL) == -1)
            return -1;
    }

    if (want_write) {
        EV_SET(&change, fd, EVFILT_WRITE, EV_ADD, 0, 0, NULL);
        if (kevent(st->kqfd, &change, 1, NULL, 0, NULL) == -1)
            return -1;
    }

    return 0;
}

/*
 * Remove the filters matching mask (EVFILT_READ for AE_READABLE,
 * EVFILT_WRITE for AE_WRITABLE) for fd.  The result of kevent() is
 * deliberately not checked.
 */
static void aeApiDelEvent(aeEventLoop *eventLoop, int fd, int mask) {
    aeApiState *st = eventLoop->apidata;
    struct kevent change;
    int drop_read = mask & AE_READABLE;
    int drop_write = mask & AE_WRITABLE;

    if (drop_read) {
        EV_SET(&change, fd, EVFILT_READ, EV_DELETE, 0, 0, NULL);
        kevent(st->kqfd, &change, 1, NULL, 0, NULL);
    }

    if (drop_write) {
        EV_SET(&change, fd, EVFILT_WRITE, EV_DELETE, 0, 0, NULL);
        kevent(st->kqfd, &change, 1, NULL, 0, NULL);
    }
}

/*
 * Wait for events for at most *tvp (forever when tvp is NULL) and copy them
 * into eventLoop->fired.  Each returned kevent becomes one fired entry whose
 * mask is AE_READABLE or AE_WRITABLE according to its filter.  Returns the
 * number of fired entries, 0 when kevent() reports none or fails.
 */
static int aeApiPoll(aeEventLoop *eventLoop, struct timeval *tvp) {
    aeApiState *st = eventLoop->apidata;
    struct timespec ts, *tsp = NULL;
    int nready, idx;

    if (tvp != NULL) {
        ts.tv_sec = tvp->tv_sec;
        ts.tv_nsec = tvp->tv_usec * 1000;
        tsp = &ts;
    }

    nready = kevent(st->kqfd, NULL, 0, st->events, eventLoop->setsize, tsp);
    if (nready <= 0)
        return 0;

    for (idx = 0; idx < nready; idx++) {
        struct kevent *ke = &st->events[idx];
        int mask = 0;

        if (ke->filter == EVFILT_READ)
            mask |= AE_READABLE;
        if (ke->filter == EVFILT_WRITE)
            mask |= AE_WRITABLE;

        eventLoop->fired[idx].fd = ke->ident;
        eventLoop->fired[idx].mask = mask;
    }

    return nready;
}

/* Name of the polling backend implemented by this module. */
static char *
aeApiName(void)
{
    return "kqueue";
}


================================================
FILE: dep/ae/ae_select.c
================================================
/* Select()-based ae.c module.
 *
 * Copyright (c) 2009-2012, Salvatore Sanfilippo <antirez at gmail dot com>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *   * Redistributions of source code must retain the above copyright notice,
 *     this list of conditions and the following disclaimer.
 *   * Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *   * Neither the name of Redis nor the names of its contributors may be used
 *     to endorse or promote products derived from this software without
 *     specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */


#include <string.h>

/* Per-event-loop state of the select() backend, stored in
 * eventLoop->apidata. */
typedef struct aeApiState {
    /* Descriptors registered for reading (rfds) and writing (wfds). */
    fd_set rfds, wfds;
    /* We need to have a copy of the fd sets as it's not safe to reuse
     * FD sets after select(). */
    fd_set _rfds, _wfds;
} aeApiState;

/*
 * Allocate the backend state with empty read and write sets and attach it
 * to the event loop.  Returns 0 on success, -1 if the allocation fails.
 */
static int aeApiCreate(aeEventLoop *eventLoop) {
    aeApiState *st;

    st = dalloc(sizeof(aeApiState));
    if (st == NULL)
        return -1;

    FD_ZERO(&st->wfds);
    FD_ZERO(&st->rfds);

    eventLoop->apidata = st;
    return 0;
}

/* Nothing is reallocated here: the request is accepted (0) only when setsize
 * is below FD_SETSIZE, and refused (-1) otherwise. */
static int aeApiResize(aeEventLoop *eventLoop, int setsize) {
    return (setsize < FD_SETSIZE) ? 0 : -1;
}

/* Release the backend state attached to the event loop. */
static void
aeApiFree(aeEventLoop *eventLoop)
{
    dfree(eventLoop->apidata);
}

/*
 * Add fd to the read and/or write set according to mask.
 *
 * Returns 0 on success, or -1 when fd cannot be represented in an fd_set
 * (negative, or not below FD_SETSIZE): FD_SET on such a descriptor is
 * undefined behaviour and would write outside the set.
 */
static int aeApiAddEvent(aeEventLoop *eventLoop, int fd, int mask) {
    aeApiState *state = eventLoop->apidata;

    if (fd < 0 || fd >= FD_SETSIZE) return -1;

    if (mask & AE_READABLE) FD_SET(fd,&state->rfds);
    if (mask & AE_WRITABLE) FD_SET(fd,&state->wfds);
    return 0;
}

/* Remove fd from the read and/or write set according to mask. */
static void aeApiDelEvent(aeEventLoop *eventLoop, int fd, int mask) {
    aeApiState *st = eventLoop->apidata;
    int drop_read = (mask & AE_READABLE) != 0;
    int drop_write = (mask & AE_WRITABLE) != 0;

    if (drop_read)
        FD_CLR(fd, &st->rfds);
    if (drop_write)
        FD_CLR(fd, &st->wfds);
}

/*
 * Wait with select() for at most *tvp (forever when tvp is NULL) and copy
 * the ready descriptors into eventLoop->fired.
 *
 * Only descriptors that select() actually reported as readable or writable
 * for an event they are registered for are returned; registered descriptors
 * that are not ready are skipped, so the return value is the number of
 * descriptors with a non-empty fired mask.  Returns 0 when select() reports
 * nothing or fails.
 */
static int aeApiPoll(aeEventLoop *eventLoop, struct timeval *tvp) {
    aeApiState *state = eventLoop->apidata;
    int retval, j, numevents = 0;

    /* select() modifies the sets it is given, so hand it working copies. */
    memcpy(&state->_rfds,&state->rfds,sizeof(fd_set));
    memcpy(&state->_wfds,&state->wfds,sizeof(fd_set));

    retval = select(eventLoop->maxfd+1,
                &state->_rfds,&state->_wfds,NULL,tvp);
    if (retval > 0) {
        for (j = 0; j <= eventLoop->maxfd; j++) {
            int mask = 0;
            aeFileEvent *fe = &eventLoop->events[j];

            if (fe->mask == AE_NONE) continue;
            if (fe->mask & AE_READABLE && FD_ISSET(j,&state->_rfds))
                mask |= AE_READABLE;
            if (fe->mask & AE_WRITABLE && FD_ISSET(j,&state->_wfds))
                mask |= AE_WRITABLE;

            /* Registered but not ready: nothing fired for this fd. */
            if (mask == 0) continue;

            eventLoop->fired[numevents].fd = j;
            eventLoop->fired[numevents].mask = mask;
            numevents++;
        }
    }
    return numevents;
}

/* Name of the polling backend implemented by this module. */
static char *
aeApiName(void)
{
    return "select";
}


================================================
FILE: dep/darray/Makefile.am
================================================
# Automake input for the darray static library.

# Removed by "make maintainer-clean".
MAINTAINERCLEANFILES = Makefile.in

# Preprocessor flags: _GNU_SOURCE is defined unless the OS_SOLARIS
# conditional is set; the -I entries add the util, jemalloc and dmalloc
# header directories.
AM_CPPFLAGS =
if !OS_SOLARIS
AM_CPPFLAGS += -D_GNU_SOURCE
endif
AM_CPPFLAGS += -I $(top_srcdir)/dep/util
AM_CPPFLAGS += -I $(top_srcdir)/dep/jemalloc-4.2.0/include
AM_CPPFLAGS += -I $(top_srcdir)/dep/dmalloc

# Warning options.
AM_CFLAGS = -Wall -Wshadow
AM_CFLAGS += -Wno-unused-parameter -Wno-unused-value

# Library and header are built/used in-tree only (noinst_ = not installed).
noinst_LIBRARIES = libdarray.a

noinst_HEADERS = darray.h

libdarray_a_SOURCES = \
	darray.c darray.h

================================================
FILE: dep/darray/darray.c
================================================
#include <stdlib.h>

#include <dmalloc.h>

#include <darray.h>

/*
 * Allocate a darray header together with storage for n elements of size
 * bytes each.  The array starts empty (nelem == 0, nalloc == n).
 *
 * Returns the new array, or NULL if n * size does not fit in a size_t or if
 * either allocation fails.
 */
darray *
darray_create(unsigned long long n, size_t size)
{
    darray *a;

    /* Refuse requests whose byte count would wrap around in n * size and
     * silently yield a buffer that is too small. */
    if (size != 0 && n > (size_t)-1 / size) {
        return NULL;
    }

    a = dalloc(sizeof(*a));
    if (a == NULL) {
        return NULL;
    }

    a->elem = dalloc(n * size);
    if (a->elem == NULL) {
        dfree(a);
        return NULL;
    }

    a->nelem = 0;
    a->size = size;
    a->nalloc = n;

    return a;
}

/*
 * Release an array: first its element storage (via darray_deinit), then the
 * header itself.
 */
void
darray_destroy(darray *a)
{
    /* The storage is reached through the header, so it has to go first. */
    darray_deinit(a);

    dfree(a);
}

/*
 * Initialize a caller-provided darray header with freshly allocated storage
 * for n elements of size bytes each.  The array starts empty.
 *
 * Returns 0 on success, or -1 if n * size does not fit in a size_t or the
 * allocation fails; the header's nelem/size/nalloc are not written in that
 * case.
 */
int
darray_init(darray *a, unsigned long long n, size_t size)
{
    /* Refuse requests whose byte count would wrap around in n * size. */
    if (size != 0 && n > (size_t)-1 / size) {
        return -1;
    }

    a->elem = dalloc(n * size);
    if (a->elem == NULL) {
        return -1;
    }

    a->nelem = 0;
    a->size = size;
    a->nalloc = n;

    return 0;
}

/* Release the element storage of an array, if it has any.  The header
 * itself is left to the caller. */
void
darray_deinit(darray *a)
{
    if (a->elem == NULL) {
        return;
    }

    dfree(a->elem);
}

/*
 * Convert a pointer into the element storage back to an element index: the
 * byte distance from a->elem divided by the element size.  No check is made
 * that elem actually lies inside the array.
 */
unsigned long long
darray_idx(darray *a, void *elem)
{
    char *base = a->elem;
    char *target = elem;
    unsigned long long byte_off = (unsigned long long)(target - base);

    return byte_off / (unsigned long long)a->size;
}

/*
 * Reserve the next element slot and return a pointer to it; the caller
 * fills the slot in.  When the array is full its capacity is doubled, or
 * set to one slot if the capacity was zero (doubling zero would leave the
 * array without room for the slot being returned).
 *
 * Returns NULL, leaving the array unchanged, if the new size would overflow
 * or the reallocation fails.
 */
void *
darray_push(darray *a)
{
    void *elem, *grown;
    unsigned long long nalloc;

    if (a->nelem == a->nalloc) {

        /* the array is full; allocate new array */
        nalloc = (a->nalloc == 0) ? 1 : a->nalloc * 2;

        /* Reject a wrapped element count or a wrapped byte count. */
        if (nalloc < a->nalloc ||
            (a->size != 0 && nalloc > (size_t)-1 / a->size)) {
            return NULL;
        }

        grown = drealloc(a->elem, a->size * nalloc);
        if (grown == NULL) {
            return NULL;
        }

        a->elem = grown;
        a->nalloc = nalloc;
    }

    elem = (char *)a->elem + a->size * a->nelem;
    a->nelem++;

    return elem;
}

/*
 * Remove the last element and return a pointer to its slot.  The storage is
 * not shrunk, so the pointer stays usable until the slot is reused by a
 * later push or the storage is reallocated or freed.
 *
 * Returns NULL when the array is empty instead of letting nelem wrap around
 * and handing out a pointer outside the storage.
 */
void *
darray_pop(darray *a)
{
    void *elem;

    if (a->nelem == 0) {
        return NULL;
    }

    a->nelem--;
    elem = (char *)a->elem + a->size * a->nelem;

    return elem;
}

/*
 * Return a pointer to the slot at position idx, i.e. a->elem advanced by
 * idx element sizes.  idx is not checked against nelem or nalloc.
 */
void *
darray_get(darray *a, unsigned long long idx)
{
    char *base = (char *)a->elem;

    return base + (a->size * idx);
}

/*
 * Return a pointer to the last element without removing it, or NULL when
 * the array is empty (nelem - 1 would otherwise wrap around and produce a
 * pointer outside the storage).
 */
void *
darray_top(darray *a)
{
    if (a->nelem == 0) {
        return NULL;
    }

    return darray_get(a, a->nelem - 1);
}

/* Exchange the contents of two array headers (storage pointer, counts and
 * element size); no element data is copied. */
void
darray_swap(darray *a, darray *b)
{
    darray saved_a = *a;

    *a = *b;
    *b = saved_a;
}

/*
 * Sort the nelem stored elements in place with qsort(); the ordering is
 * ascending with respect to the compare callback.
 */
void
darray_sort(darray *a, darray_compare_t compare)
{
    size_t count = a->nelem;
    size_t width = a->size;

    qsort(a->elem, count, width, compare);
}

/*
 * Call func(elem, data) for each element in index order.  The element count
 * is read once before the first call.  Iteration stops at the first call
 * that returns non-zero, in which case -1 is returned (not func's own
 * value); 0 is returned when every call succeeded.
 */
int
darray_each(darray *a, darray_each_t func, void *data)
{
    unsigned long long total = darray_n(a);
    unsigned long long pos = 0;

    while (pos < total) {
        if (func(darray_get(a, pos), data) != 0) {
            return -1;
        }
        pos++;
    }

    return 0;
}


================================================
FILE: dep/darray/darray.h
================================================
#ifndef _DARRAY_H_
#define _DARRAY_H_

/* Comparator passed to darray_sort(), which hands it straight to qsort(). */
typedef int (*darray_compare_t)(const void *, const void *);
/* Callback for darray_each(): receives an element pointer and the caller's
 * data pointer; a non-zero return stops the iteration. */
typedef int (*darray_each_t)(void *, void *);

/* Array header: a contiguous block of nalloc slots of size bytes each, of
 * which the first nelem are in use. */
typedef struct darray {
    unsigned long long   nelem;  /* # element */
    void                 *elem;  /* element */
    size_t               size;   /* element size */
    unsigned long long   nalloc; /* # allocated element */
} darray;

/* Initializer for an empty header with no storage (same values that
 * darray_null() assigns). */
#define null_darray { 0, NULL, 0, 0 }

/* Reset a header to the empty state: no storage, zero counts and zero
 * element size.  Existing storage is not freed. */
static inline void
darray_null(darray *a)
{
    a->elem = NULL;
    a->nalloc = 0;
    a->nelem = 0;
    a->size = 0;
}

/* Point a header at caller-supplied storage holding nalloc slots of size
 * bytes each; the array starts with no elements in use. */
static inline void
darray_set(darray *a, void *elem, size_t size, unsigned long long nalloc)
{
    a->elem = elem;
    a->nalloc = nalloc;
    a->size = size;
    a->nelem = 0;
}

/* Number of elements currently stored in the array. */
static inline unsigned long long
darray_n(const darray *a)
{
    unsigned long long count = a->nelem;

    return count;
}

/* Lifecycle: create/destroy manage a heap-allocated header plus its storage;
 * init/deinit manage only the storage of a caller-owned header. */
darray *darray_create(unsigned long long n, size_t size);
void darray_destroy(darray *a);
int darray_init(darray *a, unsigned long long n, size_t size);
void darray_deinit(darray *a);

/* Element access.  push returns the slot for a new last element (growing the
 * storage when full), pop removes the last element and returns its slot, get
 * and top return slots without modifying the array, idx maps an element
 * pointer back to its index. */
unsigned long long darray_idx(darray *a, void *elem);
void *darray_push(darray *a);
void *darray_pop(darray *a);
void *darray_get(darray *a, unsigned long long idx);
void *darray_top(darray *a);
/* Whole-array operations: exchange two headers, qsort() the elements, or
 * call func on each element until one call returns non-zero. */
void darray_swap(darray *a, darray *b);
void darray_sort(darray *a, darray_compare_t compare);
int darray_each(darray *a, darray_each_t func, void *data);

#endif


================================================
FILE: dep/dhashkit/Makefile.am
================================================
# Automake input for the dhashkit static library (hash and distribution
# functions).

# Removed by "make maintainer-clean".
MAINTAINERCLEANFILES = Makefile.in

# Warning options.
AM_CFLAGS = -Wall -Wshadow
AM_CFLAGS += -Wno-unused-parameter -Wno-unused-value

# Library and header are built/used in-tree only (noinst_ = not installed).
noinst_LIBRARIES = libdhashkit.a

noinst_HEADERS = dhashkit.h

# One source file per hash or distribution implementation.
libdhashkit_a_SOURCES =	\
	dhashkit.h		    \
	dcrc16.c			\
	dcrc32.c			\
	dfnv.c			    \
	dhsieh.c			\
	djenkins.c		    \
	dketama.c			\
	dmd5.c			    \
	dmodula.c			\
	dmurmur.c			\
	done_at_a_time.c	\
	drandom.c			\
	dsha1.c

================================================
FILE: dep/dhashkit/dcrc16.c
================================================
#include <dhashkit.h>

/*
 * Lookup table of 256 16-bit values used by hash_crc16(), which indexes it
 * with one byte per input character.
 * NOTE(review): entry 1 is 0x1021, which looks like the CRC-16/CCITT
 * polynomial - confirm before relying on a specific CRC variant.
 */
static const uint16_t crc16tab[256] = {
  0x0000, 0x1021, 0x2042, 0x3063, 0x4084, 0x50a5, 0x60c6, 0x70e7,
  0x8108, 0x9129, 0xa14a, 0xb16b, 0xc18c, 0xd1ad, 0xe1ce, 0xf1ef,
  0x1231, 0x0210, 0x3273, 0x2252, 0x52b5, 0x4294, 0x72f7, 0x62d6,
  0x9339, 0x8318, 0xb37b, 0xa35a, 0xd3bd, 0xc39c, 0xf3ff, 0xe3de,
  0x2462, 0x3443, 0x0420, 0x1401, 0x64e6, 0x74c7, 0x44a4, 0x5485,
  0xa56a, 0xb54b, 0x8528, 0x9509, 0xe5ee, 0xf5cf, 0xc5ac, 0xd58d,
  0x3653, 0x2672, 0x1611, 0x0630, 0x76d7, 0x66f6, 0x5695, 0x46b4,
  0xb75b, 0xa77a, 0x9719, 0x8738, 0xf7df, 0xe7fe, 0xd79d, 0xc7bc,
  0x48c4, 0x58e5, 0x6886, 0x78a7, 0x0840, 0x1861, 0x2802, 0x3823,
  0xc9cc, 0xd9ed, 0xe98e, 0xf9af, 0x8948, 0x9969, 0xa90a, 0xb92b,
  0x5af5, 0x4ad4, 0x7ab7, 0x6a96, 0x1a71, 0x0a50, 0x3a33, 0x2a12,
  0xdbfd, 0xcbdc, 0xfbbf, 0xeb9e, 0x9b79, 0x8b58, 0xbb3b, 0xab1a,
  0x6ca6, 0x7c87, 0x4ce4, 0x5cc5, 0x2c22, 0x3c03, 0x0c60, 0x1c41,
  0xedae, 0xfd8f, 0xcdec, 0xddcd, 0xad2a, 0xbd0b, 0x8d68, 0x9d49,
  0x7e97, 0x6eb6, 0x5ed5, 0x4ef4, 0x3e13, 0x2e32, 0x1e51, 0x0e70,
  0xff9f, 0xefbe, 0xdfdd, 0xcffc, 0xbf1b, 0xaf3a, 0x9f59, 0x8f78,
  0x9188, 0x81a9, 0xb1ca, 0xa1eb, 0xd10c, 0xc12d, 0xf14e, 0xe16f,
  0x1080, 0x00a1, 0x30c2, 0x20e3, 0x5004, 0x4025, 0x7046, 0x6067,
  0x83b9, 0x9398, 0xa3fb, 0xb3da, 0xc33d, 0xd31c, 0xe37f, 0xf35e,
  0x02b1, 0x1290, 0x22f3, 0x32d2, 0x4235, 0x5214, 0x6277, 0x7256,
  0xb5ea, 0xa5cb, 0x95a8, 0x8589, 0xf56e, 0xe54f, 0xd52c, 0xc50d,
  0x34e2, 0x24c3, 0x14a0, 0x0481, 0x7466, 0x6447, 0x5424, 0x4405,
  0xa7db, 0xb7fa, 0x8799, 0x97b8, 0xe75f, 0xf77e, 0xc71d, 0xd73c,
  0x26d3, 0x36f2, 0x0691, 0x16b0, 0x6657, 0x7676, 0x4615, 0x5634,
  0xd94c, 0xc96d, 0xf90e, 0xe92f, 0x99c8, 0x89e9, 0xb98a, 0xa9ab,
  0x5844, 0x4865, 0x7806, 0x6827, 0x18c0, 0x08e1, 0x3882, 0x28a3,
  0xcb7d, 0xdb5c, 0xeb3f, 0xfb1e, 0x8bf9, 0x9bd8, 0xabbb, 0xbb9a,
  0x4a75, 0x5a54, 0x6a37, 0x7a16, 0x0af1, 0x1ad0, 0x2ab3, 0x3a92,
  0xfd2e, 0xed0f, 0xdd6c, 0xcd4d, 0xbdaa, 0xad8b, 0x9de8, 0x8dc9,
  0x7c26, 0x6c07, 0x5c64, 0x4c45, 0x3ca2, 0x2c83, 0x1ce0, 0x0cc1,
  0xef1f, 0xff3e, 0xcf5d, 0xdf7c, 0xaf9b, 0xbfba, 0x8fd9, 0x9ff8,
  0x6e17, 0x7e36, 0x4e55, 0x5e74, 0x2e93, 0x3eb2, 0x0ed1, 0x1ef0,
};

/*
 * Table-driven CRC over key_length bytes of key, starting from 0.  The
 * running value is kept in 32 bits and returned without being masked to 16
 * bits, so bits above the low 16 may be set in the result.
 */
uint32_t
hash_crc16(const char *key, size_t key_length)
{
    uint32_t crc = 0;
    size_t i;

    for (i = 0; i < key_length; i++) {
        /* Table slot: bits 8..15 of the running value xor the input byte. */
        uint32_t slot = ((crc >> 8) ^ key[i]) & 0x00ff;

        crc = (crc << 8) ^ crc16tab[slot];
    }

    return crc;
}


================================================
FILE: dep/dhashkit/dcrc32.c
================================================
#include <dhashkit.h>

/*
 * Lookup table of 256 32-bit values shared by hash_crc32() and
 * hash_crc32a(); both index it with the low byte of the running CRC xor the
 * input byte.
 * NOTE(review): entry 128 is 0xedb88320, which looks like the reflected
 * IEEE 802.3 CRC-32 polynomial - confirm.
 */
static const uint32_t crc32tab[256] = {
    0x00000000, 0x77073096, 0xee0e612c, 0x990951ba,
    0x076dc419, 0x706af48f, 0xe963a535, 0x9e6495a3,
    0x0edb8832, 0x79dcb8a4, 0xe0d5e91e, 0x97d2d988,
    0x09b64c2b, 0x7eb17cbd, 0xe7b82d07, 0x90bf1d91,
    0x1db71064, 0x6ab020f2, 0xf3b97148, 0x84be41de,
    0x1adad47d, 0x6ddde4eb, 0xf4d4b551, 0x83d385c7,
    0x136c9856, 0x646ba8c0, 0xfd62f97a, 0x8a65c9ec,
    0x14015c4f, 0x63066cd9, 0xfa0f3d63, 0x8d080df5,
    0x3b6e20c8, 0x4c69105e, 0xd56041e4, 0xa2677172,
    0x3c03e4d1, 0x4b04d447, 0xd20d85fd, 0xa50ab56b,
    0x35b5a8fa, 0x42b2986c, 0xdbbbc9d6, 0xacbcf940,
    0x32d86ce3, 0x45df5c75, 0xdcd60dcf, 0xabd13d59,
    0x26d930ac, 0x51de003a, 0xc8d75180, 0xbfd06116,
    0x21b4f4b5, 0x56b3c423, 0xcfba9599, 0xb8bda50f,
    0x2802b89e, 0x5f058808, 0xc60cd9b2, 0xb10be924,
    0x2f6f7c87, 0x58684c11, 0xc1611dab, 0xb6662d3d,
    0x76dc4190, 0x01db7106, 0x98d220bc, 0xefd5102a,
    0x71b18589, 0x06b6b51f, 0x9fbfe4a5, 0xe8b8d433,
    0x7807c9a2, 0x0f00f934, 0x9609a88e, 0xe10e9818,
    0x7f6a0dbb, 0x086d3d2d, 0x91646c97, 0xe6635c01,
    0x6b6b51f4, 0x1c6c6162, 0x856530d8, 0xf262004e,
    0x6c0695ed, 0x1b01a57b, 0x8208f4c1, 0xf50fc457,
    0x65b0d9c6, 0x12b7e950, 0x8bbeb8ea, 0xfcb9887c,
    0x62dd1ddf, 0x15da2d49, 0x8cd37cf3, 0xfbd44c65,
    0x4db26158, 0x3ab551ce, 0xa3bc0074, 0xd4bb30e2,
    0x4adfa541, 0x3dd895d7, 0xa4d1c46d, 0xd3d6f4fb,
    0x4369e96a, 0x346ed9fc, 0xad678846, 0xda60b8d0,
    0x44042d73, 0x33031de5, 0xaa0a4c5f, 0xdd0d7cc9,
    0x5005713c, 0x270241aa, 0xbe0b1010, 0xc90c2086,
    0x5768b525, 0x206f85b3, 0xb966d409, 0xce61e49f,
    0x5edef90e, 0x29d9c998, 0xb0d09822, 0xc7d7a8b4,
    0x59b33d17, 0x2eb40d81, 0xb7bd5c3b, 0xc0ba6cad,
    0xedb88320, 0x9abfb3b6, 0x03b6e20c, 0x74b1d29a,
    0xead54739, 0x9dd277af, 0x04db2615, 0x73dc1683,
    0xe3630b12, 0x94643b84, 0x0d6d6a3e, 0x7a6a5aa8,
    0xe40ecf0b, 0x9309ff9d, 0x0a00ae27, 0x7d079eb1,
    0xf00f9344, 0x8708a3d2, 0x1e01f268, 0x6906c2fe,
    0xf762575d, 0x806567cb, 0x196c3671, 0x6e6b06e7,
    0xfed41b76, 0x89d32be0, 0x10da7a5a, 0x67dd4acc,
    0xf9b9df6f, 0x8ebeeff9, 0x17b7be43, 0x60b08ed5,
    0xd6d6a3e8, 0xa1d1937e, 0x38d8c2c4, 0x4fdff252,
    0xd1bb67f1, 0xa6bc5767, 0x3fb506dd, 0x48b2364b,
    0xd80d2bda, 0xaf0a1b4c, 0x36034af6, 0x41047a60,
    0xdf60efc3, 0xa867df55, 0x316e8eef, 0x4669be79,
    0xcb61b38c, 0xbc66831a, 0x256fd2a0, 0x5268e236,
    0xcc0c7795, 0xbb0b4703, 0x220216b9, 0x5505262f,
    0xc5ba3bbe, 0xb2bd0b28, 0x2bb45a92, 0x5cb36a04,
    0xc2d7ffa7, 0xb5d0cf31, 0x2cd99e8b, 0x5bdeae1d,
    0x9b64c2b0, 0xec63f226, 0x756aa39c, 0x026d930a,
    0x9c0906a9, 0xeb0e363f, 0x72076785, 0x05005713,
    0x95bf4a82, 0xe2b87a14, 0x7bb12bae, 0x0cb61b38,
    0x92d28e9b, 0xe5d5be0d, 0x7cdcefb7, 0x0bdbdf21,
    0x86d3d2d4, 0xf1d4e242, 0x68ddb3f8, 0x1fda836e,
    0x81be16cd, 0xf6b9265b, 0x6fb077e1, 0x18b74777,
    0x88085ae6, 0xff0f6a70, 0x66063bca, 0x11010b5c,
    0x8f659eff, 0xf862ae69, 0x616bffd3, 0x166ccf45,
    0xa00ae278, 0xd70dd2ee, 0x4e048354, 0x3903b3c2,
    0xa7672661, 0xd06016f7, 0x4969474d, 0x3e6e77db,
    0xaed16a4a, 0xd9d65adc, 0x40df0b66, 0x37d83bf0,
    0xa9bcae53, 0xdebb9ec5, 0x47b2cf7f, 0x30b5ffe9,
    0xbdbdf21c, 0xcabac28a, 0x53b39330, 0x24b4a3a6,
    0xbad03605, 0xcdd70693, 0x54de5729, 0x23d967bf,
    0xb3667a2e, 0xc4614ab8, 0x5d681b02, 0x2a6f2b94,
    0xb40bbe37, 0xc30c8ea1, 0x5a05df1b, 0x2d02ef8d,
};

/*
 * CRC-32 variant kept compatible with the libmemcached library; it does not
 * return the CRC-32 defined by the spec.  The table-driven CRC is computed
 * from an all-ones start value, complemented, and then only bits 16..30 are
 * returned, so the result is always in the range 0..0x7fff.
 */
uint32_t
hash_crc32(const char *key, size_t key_length)
{
    uint32_t crc = UINT32_MAX;
    size_t i = 0;

    while (i < key_length) {
        /* Only the low byte survives the mask, so the widening of the
         * (possibly negative) char does not affect the table slot. */
        uint64_t slot = (crc ^ (uint64_t)key[i]) & 0xff;

        crc = (crc >> 8) ^ crc32tab[slot];
        i++;
    }

    crc = ~crc;
    return (crc >> 16) & 0x7fff;
}

/*
 * Table-driven CRC-32 over key_length bytes of key: starts from all ones,
 * folds in one byte at a time through crc32tab, and returns the complement
 * of the final value (all 32 bits).
 */
uint32_t
hash_crc32a(const char *key, size_t key_length)
{
    /* Read the key as unsigned bytes.  The cast is required: const char *
     * does not convert implicitly to const uint8_t *. */
    const uint8_t *p = (const uint8_t *)key;
    uint32_t crc;

    crc = ~0U;
    while (key_length--) {
        crc = crc32tab[(crc ^ *p++) & 0xFF] ^ (crc >> 8);
    }

    return crc ^ ~0U;
}


================================================
FILE: dep/dhashkit/dfnv.c
================================================
#include <dhashkit.h>

/* Start values and multipliers used by the hash_fnv1* functions in this
 * file.  They are never modified, hence const. */
static const uint64_t FNV_64_INIT = UINT64_C(0xcbf29ce484222325);
static const uint64_t FNV_64_PRIME = UINT64_C(0x100000001b3);
static const uint32_t FNV_32_INIT = 2166136261UL;
static const uint32_t FNV_32_PRIME = 16777619;

/*
 * 64-bit multiply-then-xor hash over key_length bytes of key, starting from
 * FNV_64_INIT and multiplying by FNV_64_PRIME; the low 32 bits of the final
 * value are returned.  Each char is widened to 64 bits before the xor, so
 * where char is signed a negative byte also flips the upper bits.
 */
uint32_t
hash_fnv1_64(const char *key, size_t key_length)
{
    uint64_t acc = FNV_64_INIT;
    size_t i = 0;

    while (i < key_length) {
        acc *= FNV_64_PRIME;
        acc ^= (uint64_t)key[i];
        i++;
    }

    return (uint32_t)acc;
}

/*
 * Xor-then-multiply hash over key_length bytes of key.  Despite the name the
 * state is only 32 bits wide: both the start value and the multiplier are
 * the 64-bit constants truncated to 32 bits.
 */
uint32_t
hash_fnv1a_64(const char *key, size_t key_length)
{
    const uint32_t prime = (uint32_t) FNV_64_PRIME;
    uint32_t acc = (uint32_t) FNV_64_INIT;
    size_t i = 0;

    while (i < key_length) {
        acc ^= (uint32_t)key[i];
        acc *= prime;
        i++;
    }

    return acc;
}

/*
 * 32-bit multiply-then-xor hash over key_length bytes of key, starting from
 * FNV_32_INIT and multiplying by FNV_32_PRIME.
 */
uint32_t
hash_fnv1_32(const char *key, size_t key_length)
{
    uint32_t acc = FNV_32_INIT;
    size_t i = 0;

    while (i < key_length) {
        acc *= FNV_32_PRIME;
        acc ^= (uint32_t)key[i];
        i++;
    }

    return acc;
}

/*
 * 32-bit xor-then-multiply hash over key_length bytes of key, starting from
 * FNV_32_INIT and multiplying by FNV_32_PRIME.
 */
uint32_t
hash_fnv1a_32(const char *key, size_t key_length)
{
    uint32_t acc = FNV_32_INIT;
    size_t i = 0;

    while (i < key_length) {
        acc ^= (uint32_t)key[i];
        acc *= FNV_32_PRIME;
        i++;
    }

    return acc;
}


================================================
FILE: dep/dhashkit/dhashkit.h
================================================
#ifndef _DHASHKIT_H_
#define _DHASHKIT_H_

#include <stdint.h>
#include <stdio.h>

#include <sys/types.h>

/* One entry pairing a hash value with the index of a server. */
struct continuum {
    uint32_t index;  /* server index */
    uint32_t value;  /* hash value */
};

/*
 * List of supported hash functions as (enum constant, name suffix) pairs.
 * ACTION is a two-argument macro that is applied to every pair.
 */
#define HASH_CODEC(ACTION)                      \
    ACTION( HASH_ONE_AT_A_TIME, one_at_a_time ) \
    ACTION( HASH_MD5,           md5           ) \
    ACTION( HASH_CRC16,         crc16         ) \
    ACTION( HASH_CRC32,         crc32         ) \
    ACTION( HASH_CRC32A,        crc32a        ) \
    ACTION( HASH_FNV1_64,       fnv1_64       ) \
    ACTION( HASH_FNV1A_64,      fnv1a_64      ) \
    ACTION( HASH_FNV1_32,       fnv1_32       ) \
    ACTION( HASH_FNV1A_32,      fnv1a_32      ) \
    ACTION( HASH_HSIEH,         hsieh         ) \
    ACTION( HASH_MURMUR,        murmur        ) \
    ACTION( HASH_JENKINS,       jenkins       ) \

/*
 * List of supported key distribution schemes, in the same
 * (enum constant, name suffix) form as HASH_CODEC.
 */
#define DIST_CODEC(ACTION)                      \
    ACTION( DIST_KETAMA,        ketama        ) \
    ACTION( DIST_MODULA,        modula        ) \
    ACTION( DIST_RANDOM,        random        ) \

/* Expand HASH_CODEC into enum constants; HASH_SENTINEL is the entry count. */
#define DEFINE_ACTION(_hash, _name) _hash,
typedef enum hash_type {
    HASH_CODEC( DEFINE_ACTION )
    HASH_SENTINEL
} hash_type_t;
#undef DEFINE_ACTION

/* Expand DIST_CODEC into enum constants; DIST_SENTINEL is the entry count. */
#define DEFINE_ACTION(_dist, _name) _dist,
typedef enum dist_type {
    DIST_CODEC( DEFINE_ACTION )
    DIST_SENTINEL
} dist_type_t;
#undef DEFINE_ACTION

/*
 * Hash functions.  Each takes a pointer to the key bytes and the key length
 * in bytes and returns a 32-bit hash value.
 */
uint32_t hash_one_at_a_time(const char *key, size_t key_length);
/* Writes the 16-byte MD5 digest of key[0..length) into result. */
void md5_signature(const unsigned char *key, unsigned long length, unsigned char *result);
uint32_t hash_md5(const char *key, size_t key_length);
uint32_t hash_crc16(const char *key, size_t key_length);
uint32_t hash_crc32(const char *key, size_t key_length);
uint32_t hash_crc32a(const char *key, size_t key_length);
uint32_t hash_fnv1_64(const char *key, size_t key_length);
uint32_t hash_fnv1a_64(const char *key, size_t key_length);
uint32_t hash_fnv1_32(const char *key, size_t key_length);
uint32_t hash_fnv1a_32(const char *key, size_t key_length);
uint32_t hash_hsieh(const char *key, size_t key_length);
uint32_t hash_jenkins(const char *key, size_t length);
uint32_t hash_murmur(const char *key, size_t length);

/*
 * Distribution functions.  Each selects one entry from the continuum array
 * of ncontinuum elements and returns that entry's server index.
 */
uint32_t ketama_dispatch(struct continuum *continuum, uint32_t ncontinuum, uint32_t hash);
uint32_t modula_dispatch(struct continuum *continuum, uint32_t ncontinuum, uint32_t hash);
uint32_t random_dispatch(struct continuum *continuum, uint32_t ncontinuum, uint32_t hash);


/*
 * SHA-1 in C
 * By Steve Reid <steve@edmweb.com>
 * 100% Public Domain
 */
typedef struct {
    uint32_t state[5];    /* running digest words */
    uint32_t count[2];    /* message length in bits: [0] low word, [1] high word */
    unsigned char buffer[64];  /* bytes of the current, not yet processed block */
} SHA1_CTX;

/* Mixes one 64-byte block into state. */
void SHA1Transform(uint32_t state[5], const unsigned char buffer[64]);
/* Resets context to the SHA-1 initial state with a zero length. */
void SHA1Init(SHA1_CTX* context);
/* Feeds len bytes of data into the running hash. */
void SHA1Update(SHA1_CTX* context, const unsigned char* data, uint32_t len);
/* Pads the message, writes the 20-byte digest and clears context. */
void SHA1Final(unsigned char digest[20], SHA1_CTX* context);

#endif


================================================
FILE: dep/dhashkit/dhsieh.c
================================================
#include <dhashkit.h>

/*
 * get16bits(d): load two bytes at d as a little-endian 16-bit quantity.
 * GCC on i386 reads them with a single 16-bit load; everywhere else the
 * value is assembled byte by byte.
 */
#undef get16bits
#if (defined(__GNUC__) && defined(__i386__))
#define get16bits(d) (*((const uint16_t *) (d)))
#endif

#if !defined (get16bits)
#define get16bits(d) ((((uint32_t)(((const uint8_t *)(d))[1])) << 8)\
                      +(uint32_t)(((const uint8_t *)(d))[0]) )
#endif

/*
 * Hsieh-style hash of key[0..key_length).
 *
 * Returns 0 for a NULL key or a zero length.  Otherwise the key is consumed
 * four bytes at a time, the one to three leftover bytes are folded in
 * separately, and a final series of shifts spreads the bits.
 */
uint32_t
hash_hsieh(const char *key, size_t key_length)
{
    uint32_t h = 0;
    uint32_t mixed;
    size_t quads;
    int tail;

    if (key == NULL || key_length == 0) {
        return 0;
    }

    tail = key_length & 3;
    quads = key_length >> 2;

    /* Whole 4-byte groups */
    while (quads > 0) {
        h += get16bits (key);
        mixed = (get16bits (key+2) << 11) ^ h;
        h = (h << 16) ^ mixed;
        key += 2*sizeof (uint16_t);
        h += h >> 11;
        quads--;
    }

    /* Leftover bytes */
    if (tail == 3) {
        h += get16bits (key);
        h ^= h << 16;
        h ^= (uint32_t)key[sizeof (uint16_t)] << 18;
        h += h >> 11;
    } else if (tail == 2) {
        h += get16bits (key);
        h ^= h << 11;
        h += h >> 17;
    } else if (tail == 1) {
        h += (unsigned char)(*key);
        h ^= h << 10;
        h += h >> 1;
    }

    /* Final avalanche */
    h ^= h << 3;
    h += h >> 5;
    h ^= h << 4;
    h += h >> 17;
    h ^= h << 25;
    h += h >> 6;

    return h;
}


================================================
FILE: dep/dhashkit/djenkins.c
================================================
#include <dhashkit.h>

/* hashsize(n) is 2^n; hashmask(n) is the matching n-bit mask. */
#define hashsize(n) ((uint32_t)1<<(n))
#define hashmask(n) (hashsize(n)-1)
/* Rotate the 32-bit value x left by k bits. */
#define rot(x,k) (((x)<<(k)) | ((x)>>(32-(k))))

/* Mixing step applied to (a,b,c) after each full 12-byte block. */
#define mix(a,b,c) \
{ \
  a -= c;  a ^= rot(c, 4);  c += b; \
  b -= a;  b ^= rot(a, 6);  a += c; \
  c -= b;  c ^= rot(b, 8);  b += a; \
  a -= c;  a ^= rot(c,16);  c += b; \
  b -= a;  b ^= rot(a,19);  a += c; \
  c -= b;  c ^= rot(b, 4);  b += a; \
}

/* Final mixing of (a,b,c); the hash result is taken from c afterwards. */
#define final(a,b,c) \
{ \
  c ^= b; c -= rot(b,14); \
  a ^= c; a -= rot(c,11); \
  b ^= a; b -= rot(a,25); \
  c ^= b; c -= rot(b,16); \
  a ^= c; a -= rot(c,4);  \
  b ^= a; b -= rot(a,14); \
  c ^= b; c -= rot(b,24); \
}

/* Constant added to the initial state in hash_jenkins(). */
#define JENKINS_INITVAL 13

/*
 * hash_jenkins() -- hash a variable-length key into a 32-bit value
 *  key     : the key (the unaligned variable-length array of bytes)
 *  length  : the length of the key, counting by bytes
 * The initial value folded into the state is fixed at JENKINS_INITVAL.
 * Returns a 32-bit value.  Every bit of the key affects every bit of
 * the return value.  Two keys differing by one or two bits will have
 * totally different hash values.
 *
 * A zero-length key returns the initial state without any mixing.
 *
 * Unless WORDS_BIGENDIAN is defined, the key is read in 32-bit or 16-bit
 * chunks when its address is suitably aligned; otherwise it is read one
 * byte at a time.
 *
 * The best hash table sizes are powers of 2.  There is no need to do
 * mod a prime (mod is sooo slow!).  If you need less than 32 bits,
 * use a bitmask.  For example, if you need only 10 bits, do
 *   h = (h & hashmask(10));
 * In which case, the hash table should have hashsize(10) elements.
 */

uint32_t
hash_jenkins(const char *key, size_t length)
{
  uint32_t a,b,c;                                          /* internal state */
  union { const void *ptr; size_t i; } u;     /* needed for Mac Powerbook G4 */

  /* Set up the internal state */
  a = b = c = 0xdeadbeef + ((uint32_t)length) + JENKINS_INITVAL;

  /* u.i exposes the key address as an integer for the alignment tests. */
  u.ptr = key;
#ifndef WORDS_BIGENDIAN
  if ((u.i & 0x3) == 0)
  {
    const uint32_t *k = (const uint32_t *)key;         /* read 32-bit chunks */

    /*------ all but last block: aligned reads and affect 32 bits of (a,b,c) */
    while (length > 12)
    {
      a += k[0];
      b += k[1];
      c += k[2];
      mix(a,b,c);
      length -= 12;
      k += 3;
    }

    /*----------------------------- handle the last (probably partial) block */
    /*
     * "k[2]&0xffffff" actually reads beyond the end of the string, but
     * then masks off the part it's not allowed to read.  Because the
     * string is aligned, the masked-off tail is in the same word as the
     * rest of the string.  Every machine with memory protection I've seen
     * does it on word boundaries, so is OK with this.  But VALGRIND will
     * still catch it and complain.  The masking trick does make the hash
     * noticeably faster for short strings (like English words).
     */
    switch(length)
    {
    case 12: c+=k[2]; b+=k[1]; a+=k[0]; break;
    case 11: c+=k[2]&0xffffff; b+=k[1]; a+=k[0]; break;
    case 10: c+=k[2]&0xffff; b+=k[1]; a+=k[0]; break;
    case 9 : c+=k[2]&0xff; b+=k[1]; a+=k[0]; break;
    case 8 : b+=k[1]; a+=k[0]; break;
    case 7 : b+=k[1]&0xffffff; a+=k[0]; break;
    case 6 : b+=k[1]&0xffff; a+=k[0]; break;
    case 5 : b+=k[1]&0xff; a+=k[0]; break;
    case 4 : a+=k[0]; break;
    case 3 : a+=k[0]&0xffffff; break;
    case 2 : a+=k[0]&0xffff; break;
    case 1 : a+=k[0]&0xff; break;
    case 0 : return c;              /* zero length strings require no mixing */
    default: return c;
    }

  }
  else if ((u.i & 0x1) == 0)
  {
    const uint16_t *k = (const uint16_t *)key;         /* read 16-bit chunks */
    const uint8_t  *k8;

    /*--------------- all but last block: aligned reads and different mixing */
    while (length > 12)
    {
      a += k[0] + (((uint32_t)k[1])<<16);
      b += k[2] + (((uint32_t)k[3])<<16);
      c += k[4] + (((uint32_t)k[5])<<16);
      mix(a,b,c);
      length -= 12;
      k += 6;
    }

    /*----------------------------- handle the last (probably partial) block */
    /* k8 gives byte access to the odd trailing byte of the last block. */
    k8 = (const uint8_t *)k;
    switch(length)
    {
    case 12: c+=k[4]+(((uint32_t)k[5])<<16);
             b+=k[2]+(((uint32_t)k[3])<<16);
             a+=k[0]+(((uint32_t)k[1])<<16);
             break;
    case 11: c+=((uint32_t)k8[10])<<16;     /* fall through */
    case 10: c+=k[4];
             b+=k[2]+(((uint32_t)k[3])<<16);
             a+=k[0]+(((uint32_t)k[1])<<16);
             break;
    case 9 : c+=k8[8];                      /* fall through */
    case 8 : b+=k[2]+(((uint32_t)k[3])<<16);
             a+=k[0]+(((uint32_t)k[1])<<16);
             break;
    case 7 : b+=((uint32_t)k8[6])<<16;      /* fall through */
    case 6 : b+=k[2];
             a+=k[0]+(((uint32_t)k[1])<<16);
             break;
    case 5 : b+=k8[4];                      /* fall through */
    case 4 : a+=k[0]+(((uint32_t)k[1])<<16);
             break;
    case 3 : a+=((uint32_t)k8[2])<<16;      /* fall through */
    case 2 : a+=k[0];
             break;
    case 1 : a+=k8[0];
             break;
    case 0 : return c;                     /* zero length requires no mixing */
    default: return c;
    }

  }
  else
  {                        /* need to read the key one byte at a time */
#endif /* little endian */
    /* With WORDS_BIGENDIAN defined this byte-wise path is the only one. */
    const uint8_t *k = (const uint8_t *)key;

    /*--------------- all but the last block: affect some 32 bits of (a,b,c) */
    while (length > 12)
    {
      a += k[0];
      a += ((uint32_t)k[1])<<8;
      a += ((uint32_t)k[2])<<16;
      a += ((uint32_t)k[3])<<24;
      b += k[4];
      b += ((uint32_t)k[5])<<8;
      b += ((uint32_t)k[6])<<16;
      b += ((uint32_t)k[7])<<24;
      c += k[8];
      c += ((uint32_t)k[9])<<8;
      c += ((uint32_t)k[10])<<16;
      c += ((uint32_t)k[11])<<24;
      mix(a,b,c);
      length -= 12;
      k += 12;
    }

    /*-------------------------------- last block: affect all 32 bits of (c) */
    switch(length)                   /* all the case statements fall through */
    {
    case 12: c+=((uint32_t)k[11])<<24;
    case 11: c+=((uint32_t)k[10])<<16;
    case 10: c+=((uint32_t)k[9])<<8;
    case 9 : c+=k[8];
    case 8 : b+=((uint32_t)k[7])<<24;
    case 7 : b+=((uint32_t)k[6])<<16;
    case 6 : b+=((uint32_t)k[5])<<8;
    case 5 : b+=k[4];
    case 4 : a+=((uint32_t)k[3])<<24;
    case 3 : a+=((uint32_t)k[2])<<16;
    case 2 : a+=((uint32_t)k[1])<<8;
    case 1 : a+=k[0];
             break;
    case 0 : return c;
    default : return c;
    }
#ifndef WORDS_BIGENDIAN
  }
#endif

  /* Only reached for a non-empty last block: finish mixing and report c. */
  final(a,b,c);
  return c;
}


================================================
FILE: dep/dhashkit/dketama.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <math.h>

#include <dhashkit.h>

#define KETAMA_CONTINUUM_ADDITION   10  /* # extra slots to build into continuum */
#define KETAMA_POINTS_PER_SERVER    160 /* 40 points per hash */
#define KETAMA_MAX_HOSTLEN          86

/*
 * Derive a 32-bit value from the MD5 digest of key.
 *
 * alignment selects which group of four digest bytes is used (group n
 * starts at byte 4*n); the four bytes are combined in little-endian order.
 */
static uint32_t
ketama_hash(const char *key, size_t key_length, uint32_t alignment)
{
    unsigned char digest[16];
    const unsigned char *group;
    uint32_t value;

    md5_signature((const unsigned char*)key, (unsigned long)key_length, digest);

    group = &digest[alignment * 4];

    value = (uint32_t) group[3] << 24;
    value |= (uint32_t) group[2] << 16;
    value |= (uint32_t) group[1] << 8;
    value |= (uint32_t) group[0];

    return value;
}

/*
 * qsort()-style comparator ordering continuum entries by ascending hash
 * value.  Returns -1, 0 or 1.
 */
static int
ketama_item_cmp(const void *t1, const void *t2)
{
    const struct continuum *lhs = t1;
    const struct continuum *rhs = t2;

    if (lhs->value > rhs->value) {
        return 1;
    }
    if (lhs->value < rhs->value) {
        return -1;
    }
    return 0;
}

/*
 * Find the server for hash on a continuum sorted by ascending value.
 *
 * Binary-searches for the first entry whose value is not less than hash
 * and returns its server index; when every entry is smaller, wraps around
 * to the first entry.
 */
uint32_t
ketama_dispatch(struct continuum *continuum, uint32_t ncontinuum, uint32_t hash)
{
    uint32_t lo, hi, mid;

    ASSERT(continuum != NULL);
    ASSERT(ncontinuum != 0);

    lo = 0;
    hi = ncontinuum;

    while (lo < hi) {
        mid = lo + (hi - lo) / 2;
        if (continuum[mid].value < hash) {
            lo = mid + 1;
        } else {
            hi = mid;
        }
    }

    /* Past the last point: wrap to the start of the ring. */
    if (hi == ncontinuum) {
        hi = 0;
    }

    return continuum[hi].index;
}


================================================
FILE: dep/dhashkit/dmd5.c
================================================
#include <string.h>

#include <dhashkit.h>

/*
 * This is an OpenSSL-compatible implementation of the RSA Data Security, Inc.
 * MD5 Message-Digest Algorithm (RFC 1321).
 *
 * Homepage: http://openwall.info/wiki/people/solar/software/public-domain-source-code/md5
 *
 * Author: Alexander Peslyak, better known as Solar Designer <solar at openwall.com>
 */

typedef unsigned int MD5_u32plus;

/*
 * Running MD5 state.
 *  lo, hi     : message length in bytes; lo keeps the low 29 bits, hi the rest
 *  a, b, c, d : the four digest words
 *  buffer     : bytes of the current, not yet processed 64-byte block
 *  block      : decoded words of the block being processed (portable path)
 */
typedef struct {
    MD5_u32plus lo, hi;
    MD5_u32plus a, b, c, d;
    unsigned char buffer[64];
    MD5_u32plus block[16];
} MD5_CTX;

/*
 * The basic MD5 functions.
 *
 * F and G are optimized compared to their RFC 1321 definitions for
 * architectures that lack an AND-NOT instruction, just like in Colin Plumb's
 * implementation.
 */
#define F(x, y, z)          ((z) ^ ((x) & ((y) ^ (z))))
#define G(x, y, z)          ((y) ^ ((z) & ((x) ^ (y))))
#define H(x, y, z)          ((x) ^ (y) ^ (z))
#define I(x, y, z)          ((y) ^ ((x) | ~(z)))

/*
 * The MD5 transformation for all four rounds.
 */
#define STEP(f, a, b, c, d, x, t, s)                            \
    (a) += f((b), (c), (d)) + (x) + (t);                        \
    (a) = (((a) << (s)) | (((a) & 0xffffffff) >> (32 - (s))));  \
    (a) += (b);

/*
 * SET reads 4 input bytes in little-endian byte order and stores them
 * in a properly aligned word in host byte order.
 *
 * The check for little-endian architectures that tolerate unaligned
 * memory accesses is just an optimization.  Nothing will break if it
 * doesn't work.
 */
#if defined(__i386__) || defined(__x86_64__) || defined(__vax__)
#define SET(n) \
    (*(const MD5_u32plus *)&ptr[(n) * 4])
#define GET(n) \
    SET(n)
#else
#define SET(n)                                  \
    (ctx->block[(n)] =                          \
    (MD5_u32plus)ptr[(n) * 4] |                 \
    ((MD5_u32plus)ptr[(n) * 4 + 1] << 8) |      \
    ((MD5_u32plus)ptr[(n) * 4 + 2] << 16) |     \
    ((MD5_u32plus)ptr[(n) * 4 + 3] << 24))
#define GET(n) \
    (ctx->block[(n)])
#endif

/*
 * This processes one or more 64-byte data blocks, but does NOT update
 * the bit counters.  There are no alignment requirements.
 *
 * size must be a non-zero multiple of 64.  The input is only read, never
 * written.  Returns a pointer just past the last byte consumed.
 */
static const void *
body(MD5_CTX *ctx, const void *data, unsigned long size)
{
    const unsigned char *ptr;
    MD5_u32plus a, b, c, d;
    MD5_u32plus saved_a, saved_b, saved_c, saved_d;

    ptr = data;

    a = ctx->a;
    b = ctx->b;
    c = ctx->c;
    d = ctx->d;

    do {
        saved_a = a;
        saved_b = b;
        saved_c = c;
        saved_d = d;

        /* Round 1 */
        STEP(F, a, b, c, d, SET(0), 0xd76aa478, 7)
        STEP(F, d, a, b, c, SET(1), 0xe8c7b756, 12)
        STEP(F, c, d, a, b, SET(2), 0x242070db, 17)
        STEP(F, b, c, d, a, SET(3), 0xc1bdceee, 22)
        STEP(F, a, b, c, d, SET(4), 0xf57c0faf, 7)
        STEP(F, d, a, b, c, SET(5), 0x4787c62a, 12)
        STEP(F, c, d, a, b, SET(6), 0xa8304613, 17)
        STEP(F, b, c, d, a, SET(7), 0xfd469501, 22)
        STEP(F, a, b, c, d, SET(8), 0x698098d8, 7)
        STEP(F, d, a, b, c, SET(9), 0x8b44f7af, 12)
        STEP(F, c, d, a, b, SET(10), 0xffff5bb1, 17)
        STEP(F, b, c, d, a, SET(11), 0x895cd7be, 22)
        STEP(F, a, b, c, d, SET(12), 0x6b901122, 7)
        STEP(F, d, a, b, c, SET(13), 0xfd987193, 12)
        STEP(F, c, d, a, b, SET(14), 0xa679438e, 17)
        STEP(F, b, c, d, a, SET(15), 0x49b40821, 22)

        /* Round 2 */
        STEP(G, a, b, c, d, GET(1), 0xf61e2562, 5)
        STEP(G, d, a, b, c, GET(6), 0xc040b340, 9)
        STEP(G, c, d, a, b, GET(11), 0x265e5a51, 14)
        STEP(G, b, c, d, a, GET(0), 0xe9b6c7aa, 20)
        STEP(G, a, b, c, d, GET(5), 0xd62f105d, 5)
        STEP(G, d, a, b, c, GET(10), 0x02441453, 9)
        STEP(G, c, d, a, b, GET(15), 0xd8a1e681, 14)
        STEP(G, b, c, d, a, GET(4), 0xe7d3fbc8, 20)
        STEP(G, a, b, c, d, GET(9), 0x21e1cde6, 5)
        STEP(G, d, a, b, c, GET(14), 0xc33707d6, 9)
        STEP(G, c, d, a, b, GET(3), 0xf4d50d87, 14)
        STEP(G, b, c, d, a, GET(8), 0x455a14ed, 20)
        STEP(G, a, b, c, d, GET(13), 0xa9e3e905, 5)
        STEP(G, d, a, b, c, GET(2), 0xfcefa3f8, 9)
        STEP(G, c, d, a, b, GET(7), 0x676f02d9, 14)
        STEP(G, b, c, d, a, GET(12), 0x8d2a4c8a, 20)

        /* Round 3 */
        STEP(H, a, b, c, d, GET(5), 0xfffa3942, 4)
        STEP(H, d, a, b, c, GET(8), 0x8771f681, 11)
        STEP(H, c, d, a, b, GET(11), 0x6d9d6122, 16)
        STEP(H, b, c, d, a, GET(14), 0xfde5380c, 23)
        STEP(H, a, b, c, d, GET(1), 0xa4beea44, 4)
        STEP(H, d, a, b, c, GET(4), 0x4bdecfa9, 11)
        STEP(H, c, d, a, b, GET(7), 0xf6bb4b60, 16)
        STEP(H, b, c, d, a, GET(10), 0xbebfbc70, 23)
        STEP(H, a, b, c, d, GET(13), 0x289b7ec6, 4)
        STEP(H, d, a, b, c, GET(0), 0xeaa127fa, 11)
        STEP(H, c, d, a, b, GET(3), 0xd4ef3085, 16)
        STEP(H, b, c, d, a, GET(6), 0x04881d05, 23)
        STEP(H, a, b, c, d, GET(9), 0xd9d4d039, 4)
        STEP(H, d, a, b, c, GET(12), 0xe6db99e5, 11)
        STEP(H, c, d, a, b, GET(15), 0x1fa27cf8, 16)
        STEP(H, b, c, d, a, GET(2), 0xc4ac5665, 23)

        /* Round 4 */
        STEP(I, a, b, c, d, GET(0), 0xf4292244, 6)
        STEP(I, d, a, b, c, GET(7), 0x432aff97, 10)
        STEP(I, c, d, a, b, GET(14), 0xab9423a7, 15)
        STEP(I, b, c, d, a, GET(5), 0xfc93a039, 21)
        STEP(I, a, b, c, d, GET(12), 0x655b59c3, 6)
        STEP(I, d, a, b, c, GET(3), 0x8f0ccc92, 10)
        STEP(I, c, d, a, b, GET(10), 0xffeff47d, 15)
        STEP(I, b, c, d, a, GET(1), 0x85845dd1, 21)
        STEP(I, a, b, c, d, GET(8), 0x6fa87e4f, 6)
        STEP(I, d, a, b, c, GET(15), 0xfe2ce6e0, 10)
        STEP(I, c, d, a, b, GET(6), 0xa3014314, 15)
        STEP(I, b, c, d, a, GET(13), 0x4e0811a1, 21)
        STEP(I, a, b, c, d, GET(4), 0xf7537e82, 6)
        STEP(I, d, a, b, c, GET(11), 0xbd3af235, 10)
        STEP(I, c, d, a, b, GET(2), 0x2ad7d2bb, 15)
        STEP(I, b, c, d, a, GET(9), 0xeb86d391, 21)

        a += saved_a;
        b += saved_b;
        c += saved_c;
        d += saved_d;

        ptr += 64;
    } while (size -= 64);

    ctx->a = a;
    ctx->b = b;
    ctx->c = c;
    ctx->d = d;

    return ptr;
}

/* Reset ctx to the MD5 initial state with a zero message length. */
void
MD5_Init(MD5_CTX *ctx)
{
    ctx->a = 0x67452301;
    ctx->b = 0xefcdab89;
    ctx->c = 0x98badcfe;
    ctx->d = 0x10325476;

    ctx->lo = 0;
    ctx->hi = 0;
}

/*
 * Feed size bytes starting at data into the running hash.
 *
 * The input is only read.  Complete 64-byte blocks are processed
 * immediately; any remainder is kept in ctx->buffer for the next call.
 */
void
MD5_Update(MD5_CTX *ctx, const void *data, unsigned long size)
{
    MD5_u32plus saved_lo;
    unsigned long used, available;

    /* Advance the byte counter, carrying from the 29-bit low part into hi. */
    saved_lo = ctx->lo;
    if ((ctx->lo = (saved_lo + size) & 0x1fffffff) < saved_lo) {
        ctx->hi++;
    }
    ctx->hi += size >> 29;

    used = saved_lo & 0x3f;

    if (used) {
        /* Top up the partially filled buffer first. */
        available = 64 - used;

        if (size < available) {
            memcpy(&ctx->buffer[used], data, size);
            return;
        }

        memcpy(&ctx->buffer[used], data, available);
        data = (const unsigned char *)data + available;
        size -= available;
        body(ctx, ctx->buffer, 64);
    }

    if (size >= 64) {
        data = body(ctx, data, size & ~(unsigned long)0x3f);
        size &= 0x3f;
    }

    memcpy(ctx->buffer, data, size);
}

/*
 * Append the padding and length, write the 16-byte digest to result in
 * little-endian word order, and clear ctx.
 */
void
MD5_Final(unsigned char *result, MD5_CTX *ctx)
{
    unsigned long used, available;

    used = ctx->lo & 0x3f;

    ctx->buffer[used++] = 0x80;

    available = 64 - used;

    /* Not enough room left for the 8-byte length: flush an extra block. */
    if (available < 8) {
        memset(&ctx->buffer[used], 0, available);
        body(ctx, ctx->buffer, 64);
        used = 0;
        available = 64;
    }

    memset(&ctx->buffer[used], 0, available - 8);

    /* Convert the byte count to a bit count before storing it. */
    ctx->lo <<= 3;
    ctx->buffer[56] = ctx->lo;
    ctx->buffer[57] = ctx->lo >> 8;
    ctx->buffer[58] = ctx->lo >> 16;
    ctx->buffer[59] = ctx->lo >> 24;
    ctx->buffer[60] = ctx->hi;
    ctx->buffer[61] = ctx->hi >> 8;
    ctx->buffer[62] = ctx->hi >> 16;
    ctx->buffer[63] = ctx->hi >> 24;

    body(ctx, ctx->buffer, 64);

    result[0] = ctx->a;
    result[1] = ctx->a >> 8;
    result[2] = ctx->a >> 16;
    result[3] = ctx->a >> 24;
    result[4] = ctx->b;
    result[5] = ctx->b >> 8;
    result[6] = ctx->b >> 16;
    result[7] = ctx->b >> 24;
    result[8] = ctx->c;
    result[9] = ctx->c >> 8;
    result[10] = ctx->c >> 16;
    result[11] = ctx->c >> 24;
    result[12] = ctx->d;
    result[13] = ctx->d >> 8;
    result[14] = ctx->d >> 16;
    result[15] = ctx->d >> 24;

    memset(ctx, 0, sizeof(*ctx));
}

/*
 * Just a simple method for getting the signature.
 * result must point to at least 16 writable bytes.
 */
void
md5_signature(const unsigned char *key, unsigned long length, unsigned char *result)
{
    MD5_CTX my_md5;

    MD5_Init(&my_md5);
    MD5_Update(&my_md5, key, length);
    MD5_Final(result, &my_md5);
}

/*
 * 32-bit hash of key: the first four bytes of its MD5 digest combined in
 * little-endian order.
 */
uint32_t
hash_md5(const char *key, size_t key_length)
{
    unsigned char results[16];

    md5_signature((const unsigned char*)key, (unsigned long)key_length, results);

    return ((uint32_t) (results[3] & 0xFF) << 24) |
           ((uint32_t) (results[2] & 0xFF) << 16) |
           ((uint32_t) (results[1] & 0xFF) << 8) |
           (results[0] & 0xFF);
}


================================================
FILE: dep/dhashkit/dmodula.c
================================================
#include <stdio.h>
#include <stdlib.h>

#include <dhashkit.h>

#define MODULA_CONTINUUM_ADDITION   10  /* # extra slots to build into continuum */
#define MODULA_POINTS_PER_SERVER    1

/*
 * Pick the continuum entry at position hash modulo ncontinuum and return
 * its server index.
 */
uint32_t
modula_dispatch(struct continuum *continuum, uint32_t ncontinuum, uint32_t hash)
{
    ASSERT(continuum != NULL);
    ASSERT(ncontinuum != 0);

    return continuum[hash % ncontinuum].index;
}


================================================
FILE: dep/dhashkit/dmurmur.c
================================================
/*
 * "Murmur" hash provided by Austin, tanjent@gmail.com
 * http://murmurhash.googlepages.com/
 *
 * Note - This code makes a few assumptions about how your machine behaves -
 *
 * 1. We can read a 4-byte value from any address without crashing
 * 2. sizeof(int) == 4
 *
 * And it has a few limitations -
 * 1. It will not work incrementally.
 * 2. It will not produce the same results on little-endian and big-endian
 *  machines.
 *
 *  Updated to murmur2 hash - BP
 */

#include <string.h>

#include <dhashkit.h>

/*
 * Murmur2-style hash of key[0..length).
 *
 *  key    : bytes to hash
 *  length : number of bytes in key
 *
 * The seed is derived from the length.  Input words are loaded with
 * memcpy(), so the key may start at any address; the words are still taken
 * in host byte order, so results differ between little-endian and
 * big-endian machines.
 */
uint32_t
hash_murmur(const char *key, size_t length)
{
    /*
     * 'm' and 'r' are mixing constants generated offline.  They're not
     * really 'magic', they just happen to work well.
     */
    const uint32_t m = 0x5bd1e995;
    const uint32_t seed = (0xdeadbeef * (uint32_t)length);
    const int r = 24;

    /* Initialize the hash to a 'random' value */
    uint32_t h = seed ^ (uint32_t)length;

    const unsigned char *data = (const unsigned char *)key;

    /* Mix 4 bytes at a time into the hash */
    while (length >= 4) {
        uint32_t k;

        /* Copy instead of dereferencing a cast pointer: no alignment needed. */
        memcpy(&k, data, sizeof(k));

        k *= m;
        k ^= k >> r;
        k *= m;

        h *= m;
        h ^= k;

        data += 4;
        length -= 4;
    }

    /* Handle the last few bytes of the input array */
    switch (length) {
    case 3:
        h ^= ((uint32_t)data[2]) << 16;
        /* fall through */
    case 2:
        h ^= ((uint32_t)data[1]) << 8;
        /* fall through */
    case 1:
        h ^= data[0];
        h *= m;
        break;

    default:
        break;
    }

    /*
     * Do a few final mixes of the hash to ensure the last few bytes are
     * well-incorporated.
     */
    h ^= h >> 13;
    h *= m;
    h ^= h >> 15;

    return h;
}


================================================
FILE: dep/dhashkit/done_at_a_time.c
================================================
/*
 * HashKit
 * Copyright (C) 2009 Brian Aker
 * All rights reserved.
 *
 * Use and distribution licensed under the BSD license.  See
 * the COPYING file in the parent directory for full text.
 */

/*
 * This has is Jenkin's "One at A time Hash".
 * http://en.wikipedia.org/wiki/Jenkins_hash_function
 */

#include <dhashkit.h>

/*
 * Jenkins "one at a time" hash of key[0..key_length): every byte is added
 * and stirred into the accumulator, followed by a three-step final mix.
 */
uint32_t
hash_one_at_a_time(const char *key, size_t key_length)
{
    uint32_t acc = 0;
    size_t i;

    for (i = 0; i < key_length; i++) {
        acc += (uint32_t) key[i];
        acc += acc << 10;
        acc ^= acc >> 6;
    }

    acc += acc << 3;
    acc ^= acc >> 11;
    acc += acc << 15;

    return acc;
}


================================================
FILE: dep/dhashkit/drandom.c
================================================
#include <stdio.h>
#include <stdlib.h>

#include <dhashkit.h>

#define RANDOM_CONTINUUM_ADDITION   10  /* # extra slots to build into continuum */
#define RANDOM_POINTS_PER_SERVER    1

/*
 * Return the server index of a continuum entry chosen with random();
 * the hash argument is not consulted.
 */
uint32_t
random_dispatch(struct continuum *continuum, uint32_t ncontinuum, uint32_t hash)
{
    ASSERT(continuum != NULL);
    ASSERT(ncontinuum != 0);

    return continuum[random() % ncontinuum].index;
}


================================================
FILE: dep/dhashkit/dsha1.c
================================================

/* from valgrind tests */

/* ================ sha1.c ================ */
/*
SHA-1 in C
By Steve Reid <steve@edmweb.com>
100% Public Domain

Test Vectors (from FIPS PUB 180-1)
"abc"
  A9993E36 4706816A BA3E2571 7850C26C 9CD0D89D
"abcdbcdecdefdefgefghfghighijhijkijkljklmklmnlmnomnopnopq"
  84983E44 1C3BD26E BAAE4AA1 F95129E5 E54670F1
A million repetitions of "a"
  34AA973C D4C4DAA4 F61EEB2B DBAD2731 6534016F
*/

/* #define LITTLE_ENDIAN * This should be #define'd already, if true. */
/* #define SHA1HANDSOFF * Copies data before messing with it. */

#define SHA1HANDSOFF

#include <stdio.h>
#include <string.h>
#include <stdint.h>

#include <dhashkit.h>

/* Rotate value left by bits (operands here are 32-bit words). */
#define rol(value, bits) (((value) << (bits)) | ((value) >> (32 - (bits))))

/* blk0() and blk() perform the initial expand. */
/* I got the idea of expanding during the round function from SSLeay */
/* With VR_LITTLE_ENDIAN defined, blk0() byte-swaps each input word in place. */
#ifdef VR_LITTLE_ENDIAN
#define blk0(i) (block->l[i] = (rol(block->l[i],24)&0xFF00FF00) \
    |(rol(block->l[i],8)&0x00FF00FF))
#else
#define blk0(i) block->l[i]
#endif
/* blk() derives word i from four earlier words, reusing a 16-word window. */
#define blk(i) (block->l[i&15] = rol(block->l[(i+13)&15]^block->l[(i+8)&15] \
    ^block->l[(i+2)&15]^block->l[i&15],1))

/* (R0+R1), R2, R3, R4 are the different operations used in SHA1 */
#define R0(v,w,x,y,z,i) z+=((w&(x^y))^y)+blk0(i)+0x5A827999+rol(v,5);w=rol(w,30);
#define R1(v,w,x,y,z,i) z+=((w&(x^y))^y)+blk(i)+0x5A827999+rol(v,5);w=rol(w,30);
#define R2(v,w,x,y,z,i) z+=(w^x^y)+blk(i)+0x6ED9EBA1+rol(v,5);w=rol(w,30);
#define R3(v,w,x,y,z,i) z+=(((w|x)&y)|(w&x))+blk(i)+0x8F1BBCDC+rol(v,5);w=rol(w,30);
#define R4(v,w,x,y,z,i) z+=(w^x^y)+blk(i)+0xCA62C1D6+rol(v,5);w=rol(w,30);


/* Hash a single 512-bit block. This is the core of the algorithm. */
/*
 *  state  : the five running digest words, updated in place
 *  buffer : the 64-byte block to mix in; with SHA1HANDSOFF defined (as it
 *           is in this file) it is copied first and left untouched
 */

void SHA1Transform(uint32_t state[5], const unsigned char buffer[64])
{
    uint32_t a, b, c, d, e;
    /* View of the block both as 64 bytes and as 16 32-bit words. */
    typedef union {
        unsigned char c[64];
        uint32_t l[16];
    } CHAR64LONG16;
#ifdef SHA1HANDSOFF
    CHAR64LONG16 block[1];  /* use array to appear as a pointer */
    memcpy(block, buffer, 64);
#else
    /* The following had better never be used because it causes the
     * pointer-to-const buffer to be cast into a pointer to non-const.
     * And the result is written through.  I threw a "const" in, hoping
     * this will cause a diagnostic.
     */
    CHAR64LONG16* block = (const CHAR64LONG16*)buffer;
#endif
    /* Copy context->state[] to working vars */
    a = state[0];
    b = state[1];
    c = state[2];
    d = state[3];
    e = state[4];
    /* 4 rounds of 20 operations each. Loop unrolled. */
    R0(a,b,c,d,e, 0); R0(e,a,b,c,d, 1); R0(d,e,a,b,c, 2); R0(c,d,e,a,b, 3);
    R0(b,c,d,e,a, 4); R0(a,b,c,d,e, 5); R0(e,a,b,c,d, 6); R0(d,e,a,b,c, 7);
    R0(c,d,e,a,b, 8); R0(b,c,d,e,a, 9); R0(a,b,c,d,e,10); R0(e,a,b,c,d,11);
    R0(d,e,a,b,c,12); R0(c,d,e,a,b,13); R0(b,c,d,e,a,14); R0(a,b,c,d,e,15);
    R1(e,a,b,c,d,16); R1(d,e,a,b,c,17); R1(c,d,e,a,b,18); R1(b,c,d,e,a,19);
    R2(a,b,c,d,e,20); R2(e,a,b,c,d,21); R2(d,e,a,b,c,22); R2(c,d,e,a,b,23);
    R2(b,c,d,e,a,24); R2(a,b,c,d,e,25); R2(e,a,b,c,d,26); R2(d,e,a,b,c,27);
    R2(c,d,e,a,b,28); R2(b,c,d,e,a,29); R2(a,b,c,d,e,30); R2(e,a,b,c,d,31);
    R2(d,e,a,b,c,32); R2(c,d,e,a,b,33); R2(b,c,d,e,a,34); R2(a,b,c,d,e,35);
    R2(e,a,b,c,d,36); R2(d,e,a,b,c,37); R2(c,d,e,a,b,38); R2(b,c,d,e,a,39);
    R3(a,b,c,d,e,40); R3(e,a,b,c,d,41); R3(d,e,a,b,c,42); R3(c,d,e,a,b,43);
    R3(b,c,d,e,a,44); R3(a,b,c,d,e,45); R3(e,a,b,c,d,46); R3(d,e,a,b,c,47);
    R3(c,d,e,a,b,48); R3(b,c,d,e,a,49); R3(a,b,c,d,e,50); R3(e,a,b,c,d,51);
    R3(d,e,a,b,c,52); R3(c,d,e,a,b,53); R3(b,c,d,e,a,54); R3(a,b,c,d,e,55);
    R3(e,a,b,c,d,56); R3(d,e,a,b,c,57); R3(c,d,e,a,b,58); R3(b,c,d,e,a,59);
    R4(a,b,c,d,e,60); R4(e,a,b,c,d,61); R4(d,e,a,b,c,62); R4(c,d,e,a,b,63);
    R4(b,c,d,e,a,64); R4(a,b,c,d,e,65); R4(e,a,b,c,d,66); R4(d,e,a,b,c,67);
    R4(c,d,e,a,b,68); R4(b,c,d,e,a,69); R4(a,b,c,d,e,70); R4(e,a,b,c,d,71);
    R4(d,e,a,b,c,72); R4(c,d,e,a,b,73); R4(b,c,d,e,a,74); R4(a,b,c,d,e,75);
    R4(e,a,b,c,d,76); R4(d,e,a,b,c,77); R4(c,d,e,a,b,78); R4(b,c,d,e,a,79);
    /* Add the working vars back into context.state[] */
    state[0] += a;
    state[1] += b;
    state[2] += c;
    state[3] += d;
    state[4] += e;
    /* Wipe variables */
    a = b = c = d = e = 0;
#ifdef SHA1HANDSOFF
    memset(block, '\0', sizeof(block));
#endif
}


/* SHA1Init - put context into the SHA-1 starting state with a zero length */

void SHA1Init(SHA1_CTX* context)
{
    /* SHA1 initialization constants */
    static const uint32_t initial_state[5] = {
        0x67452301, 0xEFCDAB89, 0x98BADCFE, 0x10325476, 0xC3D2E1F0
    };
    unsigned word;

    for (word = 0; word < 5; word++) {
        context->state[word] = initial_state[word];
    }
    context->count[0] = 0;
    context->count[1] = 0;
}


/*
 * Feed len bytes of data into the running hash.  Full 64-byte blocks are
 * transformed right away; leftover bytes stay in context->buffer.
 */

void SHA1Update(SHA1_CTX* context, const unsigned char* data, uint32_t len)
{
    const uint32_t old_bits = context->count[0];
    uint32_t consumed;
    uint32_t fill;

    /* Advance the 64-bit bit counter kept in count[0] (low) / count[1] (high). */
    context->count[0] += len << 3;
    if (context->count[0] < old_bits) {
        context->count[1]++;
    }
    context->count[1] += (len>>29);

    /* Number of bytes already waiting in the buffer. */
    fill = (old_bits >> 3) & 63;

    if ((fill + len) <= 63) {
        consumed = 0;
    } else {
        /* Complete the buffered block, then hash whole blocks from data. */
        consumed = 64 - fill;
        memcpy(&context->buffer[fill], data, consumed);
        SHA1Transform(context->state, context->buffer);
        while (consumed + 63 < len) {
            SHA1Transform(context->state, &data[consumed]);
            consumed += 64;
        }
        fill = 0;
    }

    memcpy(&context->buffer[fill], &data[consumed], len - consumed);
}


/*
 * Pad the message, append its length and write the 20-byte digest
 * (big-endian within each state word).  The context is cleared afterwards.
 */

void SHA1Final(unsigned char digest[20], SHA1_CTX* context)
{
    unsigned char finalcount[8];
    unsigned char pad;
    unsigned idx;

    /*
     * Capture the bit count as 8 big-endian bytes (high word first) before
     * the padding below changes it.  Endian independent.
     */
    for (idx = 0; idx < 8; idx++) {
        const uint32_t word = context->count[(idx >= 4 ? 0 : 1)];
        const unsigned shift = (3-(idx & 3)) * 8;

        finalcount[idx] = (unsigned char)((word >> shift) & 255);
    }

    /* One 0x80 byte, then zero bytes until 8 bytes remain in the block. */
    pad = 0200;
    SHA1Update(context, &pad, 1);
    pad = 0000;
    while ((context->count[0] & 504) != 448) {
        SHA1Update(context, &pad, 1);
    }
    SHA1Update(context, finalcount, 8);  /* Should cause a SHA1Transform() */

    for (idx = 0; idx < 20; idx++) {
        const uint32_t word = context->state[idx>>2];
        const unsigned shift = (3-(idx & 3)) * 8;

        digest[idx] = (unsigned char)((word >> shift) & 255);
    }

    /* Wipe variables */
    memset(context, '\0', sizeof(*context));
    memset(&finalcount, '\0', sizeof(finalcount));
}
/* ================ end of sha1.c ================ */


================================================
FILE: dep/dlist/Makefile.am
================================================
MAINTAINERCLEANFILES = Makefile.in

AM_CPPFLAGS =
if !OS_SOLARIS
AM_CPPFLAGS += -D_GNU_SOURCE
endif
AM_CPPFLAGS += -I $(top_srcdir)/dep/util
AM_CPPFLAGS += -I $(top_srcdir)/dep/jemalloc-4.2.0/include
AM_CPPFLAGS += -I $(top_srcdir)/dep/dmalloc

AM_CFLAGS = -Wall -Wshadow
AM_CFLAGS += -Wno-unused-parameter -Wno-unused-value

noinst_LIBRARIES = libdlist.a

noinst_HEADERS = dlist.h dmtqueue.h dlockqueue.h

libdlist_a_SOURCES =	            \
	dlist.c dlist.h                 \
    dmtqueue.c dmtqueue.h           \
    dlockqueue.c dlockqueue.h

================================================
FILE: dep/dlist/dlist.c
================================================
#include <stdlib.h>

#include <dmalloc.h>

#include <dlist.h>

/* Allocate and initialise an empty list.
 *
 * The list is destroyed with dlistRelease(). Node values are only freed
 * on release when a free method has been installed on the list; otherwise
 * they stay the caller's responsibility.
 *
 * Returns the new list, or NULL when the allocation fails. */
dlist *dlistCreate(void)
{
    struct dlist *fresh = dalloc(sizeof(*fresh));

    if (fresh == NULL) {
        return NULL;
    }

    fresh->len = 0;
    fresh->head = NULL;
    fresh->tail = NULL;
    fresh->dup = NULL;
    fresh->free = NULL;
    fresh->match = NULL;
    return fresh;
}

/* Destroy the list: every node is freed (its value too, through the list's
 * free method when one is set) and finally the list header itself.
 *
 * This function can't fail. */
void dlistRelease(dlist *list)
{
    dlistNode *node = list->head;
    unsigned long remaining;

    for (remaining = list->len; remaining > 0; remaining--) {
        /* Remember the successor before the node's memory goes away. */
        dlistNode *following = node->next;

        if (list->free != NULL) {
            list->free(node->value);
        }
        dfree(node);
        node = following;
    }
    dfree(list);
}

/* Insert a new node holding 'value' in front of the current head.
 *
 * Returns 'list' on success. When the node cannot be allocated NULL is
 * returned and the list is left untouched. */
dlist *dlistAddNodeHead(dlist *list, void *value)
{
    dlistNode *fresh = dalloc(sizeof(*fresh));

    if (fresh == NULL) {
        return NULL;
    }

    fresh->value = value;
    fresh->prev = NULL;
    if (list->len != 0) {
        /* Link in front of the existing head. */
        fresh->next = list->head;
        list->head->prev = fresh;
    } else {
        /* First node: it is both head and tail. */
        fresh->next = NULL;
        list->tail = fresh;
    }
    list->head = fresh;
    list->len++;
    return list;
}

/* Append a new node holding 'value' after the current tail.
 *
 * Returns 'list' on success. When the node cannot be allocated NULL is
 * returned and the list is left untouched. */
dlist *dlistAddNodeTail(dlist *list, void *value)
{
    dlistNode *fresh = dalloc(sizeof(*fresh));

    if (fresh == NULL) {
        return NULL;
    }

    fresh->value = value;
    fresh->next = NULL;
    if (list->len != 0) {
        /* Link behind the existing tail. */
        fresh->prev = list->tail;
        list->tail->next = fresh;
    } else {
        /* First node: it is both head and tail. */
        fresh->prev = NULL;
        list->head = fresh;
    }
    list->tail = fresh;
    list->len++;
    return list;
}

/* Insert a new node holding 'value' next to 'old_node': after it when
 * 'after' is non-zero, before it otherwise. The list head/tail is updated
 * when 'old_node' was at the corresponding end.
 *
 * Returns 'list' on success, or NULL (list untouched) when the node
 * cannot be allocated. */
dlist *dlistInsertNode(dlist *list, dlistNode *old_node, void *value, int after) {
    dlistNode *fresh = dalloc(sizeof(*fresh));
    dlistNode *left, *right;

    if (fresh == NULL) {
        return NULL;
    }
    fresh->value = value;

    /* Work out the two neighbours the new node will sit between. */
    if (after) {
        left = old_node;
        right = old_node->next;
        if (list->tail == old_node) {
            list->tail = fresh;
        }
    } else {
        left = old_node->prev;
        right = old_node;
        if (list->head == old_node) {
            list->head = fresh;
        }
    }

    fresh->prev = left;
    fresh->next = right;
    if (left != NULL) {
        left->next = fresh;
    }
    if (right != NULL) {
        right->prev = fresh;
    }
    list->len++;
    return list;
}

/* Unlink 'node' from 'list' and free it.
 * The node's value is passed to the list's free method when one is set;
 * without a free method the value is left for the caller to release.
 *
 * This function can't fail. */
void dlistDelNode(dlist *list, dlistNode *node)
{
    dlistNode *before = node->prev;
    dlistNode *after = node->next;

    /* Bypass the node on the forward chain (or move the head). */
    if (before != NULL) {
        before->next = after;
    } else {
        list->head = after;
    }

    /* Bypass the node on the backward chain (or move the tail). */
    if (after != NULL) {
        after->prev = before;
    } else {
        list->tail = before;
    }

    if (list->free != NULL) {
        list->free(node->value);
    }
    dfree(node);
    list->len--;
}

/* Allocate an iterator over 'list'. With AL_START_HEAD it starts at the
 * head, with any other direction value it starts at the tail. Each call
 * to dlistNext() then yields the next element in that direction.
 *
 * Returns NULL when the iterator cannot be allocated. Release the
 * iterator with dlistReleaseIterator(). */
dlistIter *dlistGetIterator(dlist *list, int direction)
{
    dlistIter *cursor = dalloc(sizeof(*cursor));

    if (cursor == NULL) {
        return NULL;
    }

    cursor->next = (direction == AL_START_HEAD) ? list->head : list->tail;
    cursor->direction = direction;
    return cursor;
}

/* Release the iterator memory.
 * Only the iterator itself is freed; the list it walked is not touched. */
void dlistReleaseIterator(dlistIter *iter) {
    dfree(iter);
}

/* (Re)initialise the caller-provided iterator 'li' so that it walks 'list'
 * from the head towards the tail. No memory is allocated. */
void dlistRewind(dlist *list, dlistIter *li) {
    li->next = list->head;
    li->direction = AL_START_HEAD;
}

/* (Re)initialise the caller-provided iterator 'li' so that it walks 'list'
 * from the tail towards the head. No memory is allocated. */
void dlistRewindTail(dlist *list, dlistIter *li) {
    li->next = list->tail;
    li->direction = AL_START_TAIL;
}

/* Return the element the iterator currently points at and advance the
 * iterator one step in its direction.
 *
 * The iterator is advanced before the element is handed out, so it is
 * valid to remove the returned element with dlistDelNode(), but not to
 * remove other elements.
 *
 * NULL is returned once there are no more elements, so the classical
 * usage pattern is:
 *
 * iter = dlistGetIterator(list,<direction>);
 * while ((node = dlistNext(iter)) != NULL) {
 *     doSomethingWith(dlistNodeValue(node));
 * }
 *
 * */
dlistNode *dlistNext(dlistIter *iter)
{
    dlistNode *current = iter->next;

    if (current == NULL) {
        return NULL;
    }

    iter->next = (iter->direction == AL_START_HEAD) ? current->next
                                                    : current->prev;
    return current;
}

/* Duplicate the whole list. On out of memory NULL is returned.
 * On success a copy of the original list is returned.
 *
 * The 'dup' method set with dlistSetDupMethod() is used to copy each node
 * value. Without a dup method the copied node stores the same value
 * pointer as the original node.
 *
 * The original list is never modified, both on success and on error. To
 * guarantee that on the error path:
 *  - a value that was duplicated but could not be appended is handed to
 *    the free method directly, because releasing the partial copy would
 *    not reach it;
 *  - when no dup method is set the partial copy only borrows the
 *    original's values, so its free method is cleared before release. */
dlist *dlistDup(dlist *orig)
{
    dlist *copy;
    dlistIter iter;
    dlistNode *node;

    if ((copy = dlistCreate()) == NULL)
        return NULL;
    copy->dup = orig->dup;
    copy->free = orig->free;
    copy->match = orig->match;
    dlistRewind(orig, &iter);
    while((node = dlistNext(&iter)) != NULL) {
        void *value = node->value;

        if (copy->dup) {
            value = copy->dup(node->value);
            if (value == NULL)
                goto fail;
        }
        if (dlistAddNodeTail(copy, value) == NULL) {
            /* The fresh duplicate is not linked anywhere yet. */
            if (copy->dup && copy->free) copy->free(value);
            goto fail;
        }
    }
    return copy;

fail:
    /* Never run the free method on values still owned by 'orig'. */
    if (copy->dup == NULL) copy->free = NULL;
    dlistRelease(copy);
    return NULL;
}

/* Find the first node (scanning from the head) that matches 'key'.
 *
 * When a 'match' method was installed with dlistSetMatchMethod() a node
 * matches if the method returns non-zero for (node value, key). Without
 * a match method the node's value pointer is compared with 'key'
 * directly.
 *
 * Returns the matching node, or NULL if no node matches. */
dlistNode *dlistSearchKey(dlist *list, void *key)
{
    dlistIter cursor;
    dlistNode *candidate;

    for (dlistRewind(list, &cursor);
         (candidate = dlistNext(&cursor)) != NULL; ) {
        int hit;

        if (list->match) {
            hit = list->match(candidate->value, key);
        } else {
            hit = (key == candidate->value);
        }
        if (hit) {
            return candidate;
        }
    }
    return NULL;
}

/* Return the element at the specified zero-based index
 * where 0 is the head, 1 is the element next to head
 * and so on. Negative integers are used in order to count
 * from the tail, -1 is the last element, -2 the penultimate
 * and so on. If the index is out of range NULL is returned. */
dlistNode *dlistIndex(dlist *list, long index) {
    dlistNode *n;

    if (index < 0) {
        /* Number of steps back from the tail. Written as -(index+1)
         * rather than (-index)-1 so that the most negative long does
         * not overflow when negated. */
        index = -(index + 1);
        n = list->tail;
        while(index-- && n) n = n->prev;
    } else {
        n = list->head;
        while(index-- && n) n = n->next;
    }
    return n;
}

/* Rotate the list by one position: the tail node is unlinked and becomes
 * the new head. Lists with fewer than two nodes are left unchanged. */
void dlistRotate(dlist *list) {
    dlistNode *moved;

    if (dlistLength(list) <= 1) {
        return;
    }

    moved = list->tail;

    /* The penultimate node becomes the tail. */
    list->tail = moved->prev;
    list->tail->next = NULL;

    /* Re-link the detached node in front of the old head. */
    moved->prev = NULL;
    moved->next = list->head;
    list->head->prev = moved;
    list->head = moved;
}

/* Queue-style append: add 'value' at the tail of 'list'.
 *
 * Returns 'list' on success, or NULL when the node could not be allocated
 * (in which case the list is unchanged and 'value' was not stored). */
dlist *dlistPush(dlist *list, void *value) {
    return dlistAddNodeTail(list, value);
}

/* Queue-style removal: detach the head node of 'list' and free the node.
 *
 * Returns the value the node held, or NULL when the list is empty.
 * When the list has a free method, dlistDelNode() has already passed the
 * value to it, so NULL is returned instead of a pointer that may no
 * longer be valid. */
void *dlistPop(dlist *list) {
    dlistNode *front = dlistFirst(list);
    void *payload;

    if (front == NULL) {
        return NULL;
    }

    payload = dlistNodeValue(front);
    dlistDelNode(list, front);

    return (list->free != NULL) ? NULL : payload;
}


================================================
FILE: dep/dlist/dlist.h
================================================
#ifndef _DLIST_H__
#define _DLIST_H__

/* Node, List, and Iterator are the only data structures used currently. */

/* One element of the doubly linked list. */
typedef struct dlistNode {
    struct dlistNode *prev;     /* previous node, NULL for the head */
    struct dlistNode *next;     /* next node, NULL for the tail */
    void *value;                /* caller-supplied payload pointer */
} dlistNode;

/* Cursor used by dlistNext(). */
typedef struct dlistIter {
    dlistNode *next;            /* node the next dlistNext() call returns */
    int direction;              /* AL_START_HEAD or AL_START_TAIL */
} dlistIter;

/* List header. The three callbacks are optional and may be NULL. */
typedef struct dlist {
    dlistNode *head;                        /* first node, NULL when empty */
    dlistNode *tail;                        /* last node, NULL when empty */
    void *(*dup)(void *ptr);                /* copies a value in dlistDup() */
    void (*free)(void *ptr);                /* releases a value when its node is deleted */
    int (*match)(void *ptr, void *key);     /* non-zero when a value matches 'key' in dlistSearchKey() */
    unsigned long len;                      /* number of nodes in the list */
} dlist;

/* Functions implemented as macros.
 * They access the structure fields directly and perform no NULL checks on
 * the list or node argument. */
#define dlistLength(l) ((l)->len)
#define dlistFirst(l) ((l)->head)
#define dlistLast(l) ((l)->tail)
#define dlistPrevNode(n) ((n)->prev)
#define dlistNextNode(n) ((n)->next)
#define dlistNodeValue(n) ((n)->value)

/* Install the optional per-list callbacks (pass NULL to clear one). */
#define dlistSetDupMethod(l,m) ((l)->dup = (m))
#define dlistSetFreeMethod(l,m) ((l)->free = (m))
#define dlistSetMatchMethod(l,m) ((l)->match = (m))

/* Read back the currently installed callbacks. */
#define dlistGetDupMethod(l) ((l)->dup)
#define dlistGetFree(l) ((l)->free)
#define dlistGetMatchMethod(l) ((l)->match)

/* Prototypes */
dlist *dlistCreate(void);
void dlistRelease(dlist *list);
dlist *dlistAddNodeHead(dlist *list, void *value);
dlist *dlistAddNodeTail(dlist *list, void *value);
dlist *dlistInsertNode(dlist *list, dlistNode *old_node, void *value, int after);
void dlistDelNode(dlist *list, dlistNode *node);
dlistIter *dlistGetIterator(dlist *list, int direction);
dlistNode *dlistNext(dlistIter *iter);
void dlistReleaseIterator(dlistIter *iter);
dlist *dlistDup(dlist *orig);
dlistNode *dlistSearchKey(dlist *list, void *key);
dlistNode *dlistIndex(dlist *list, long index);
void dlistRewind(dlist *list, dlistIter *li);
void dlistRewindTail(dlist *list, dlistIter *li);
void dlistRotate(dlist *list);
dlist *dlistPush(dlist *list, void *value);
void *dlistPop(dlist *list);

/* Directions for iterators */
#define AL_START_HEAD 0
#define AL_START_TAIL 1

#endif /* _DLIST_H__ */


================================================
FILE: dep/dlist/dlockqueue.c
================================================
#include <pthread.h>
#include <stdlib.h>
#include <stdio.h>

#include <dmalloc.h>

#include <dlist.h>
#include <dmtqueue.h>
#include <dlockqueue.h>

/* Create an empty mutex-protected queue.
 *
 * The queue starts with maxlen -1 and the REJECT policy. Returns NULL
 * when either the queue or its underlying list cannot be allocated. */
dlockqueue *dlockqueue_create(void)
{
    dlockqueue *fresh = dalloc(sizeof(*fresh));

    if (fresh == NULL) {
        return NULL;
    }

    fresh->maxlen = -1;
    fresh->maxlen_policy = MAX_LENGTH_POLICY_REJECT;
    pthread_mutex_init(&fresh->lmutex,NULL);

    fresh->l = dlistCreate();
    if (fresh->l != NULL) {
        return fresh;
    }

    /* List allocation failed: tear down the mutex and the queue again. */
    dlockqueue_destroy(fresh);
    return NULL;
}

/* Append 'value' to the queue while holding the queue mutex.
 *
 * When maxlen is positive and the queue is already that long, the
 * configured policy decides what happens:
 *   MAX_LENGTH_POLICY_REJECT      - nothing is stored;
 *   MAX_LENGTH_POLICY_EVICT_HEAD  - nodes are deleted from the head until
 *                                   there is room, then 'value' is appended;
 *   MAX_LENGTH_POLICY_EVICT_END   - nodes are deleted from the tail until
 *                                   there is room, then 'value' is appended.
 * An unrecognised policy value is treated like REJECT.
 *
 * Returns the queue length after the push, or -1 when 'q' is invalid, the
 * value was rejected, or the new node could not be allocated. */
long long dlockqueue_push(void *q, void *value)
{
    dlockqueue *lqueue = q;
    dlist *list = NULL;     /* stays NULL unless the value was stored */
    long long length;

    if (lqueue == NULL || lqueue->l == NULL) {
        return -1;
    }

    pthread_mutex_lock(&lqueue->lmutex);
    length = (long long)dlistLength(lqueue->l);
    if (lqueue->maxlen > 0 && length >= lqueue->maxlen) {
        if (lqueue->maxlen_policy == MAX_LENGTH_POLICY_EVICT_HEAD) {
            while (length >= lqueue->maxlen) {
                dlistNode *ln = dlistFirst(lqueue->l);
                dlistDelNode(lqueue->l,ln);
                length = (long long)dlistLength(lqueue->l);
            }
            list = dlistAddNodeTail(lqueue->l, value);
        } else if (lqueue->maxlen_policy == MAX_LENGTH_POLICY_EVICT_END) {
            while (length >= lqueue->maxlen) {
                dlistNode *ln = dlistLast(lqueue->l);
                dlistDelNode(lqueue->l,ln);
                length = (long long)dlistLength(lqueue->l);
            }
            list = dlistAddNodeTail(lqueue->l, value);
        }
        /* REJECT (or an unknown policy): leave 'list' NULL. */
    } else {
        list = dlistAddNodeTail(lqueue->l, value);
    }
    if (list != NULL) {
        length = (long long)dlistLength(lqueue->l);
    }
    pthread_mutex_unlock(&lqueue->lmutex);

    if (list == NULL) {
        return -1;
    }

    return length;
}

/* Remove the head element of the queue while holding the queue mutex.
 *
 * Returns the value that was stored, or NULL when 'q' is invalid or the
 * queue is empty. Ownership of the returned value passes to the caller:
 * the list's free method is suspended while the node is deleted, so the
 * value is NOT released even when a free function was installed (that
 * function still runs for evicted elements and on destroy). */
void *dlockqueue_pop(void *q)
{
    dlockqueue *lqueue = q;
    dlistNode *node;
    void *value;
    void (*saved_free)(void *ptr);

    if (lqueue == NULL || lqueue->l == NULL) {
        return NULL;
    }

    pthread_mutex_lock(&lqueue->lmutex);

    node = dlistFirst(lqueue->l);
    if (node == NULL) {
        pthread_mutex_unlock(&lqueue->lmutex);
        return NULL;
    }

    value = dlistNodeValue(node);

    /* dlistDelNode() would hand the value to the free method and leave the
     * caller with a dangling pointer; disable it for this one deletion. */
    saved_free = lqueue->l->free;
    lqueue->l->free = NULL;
    dlistDelNode(lqueue->l, node);
    lqueue->l->free = saved_free;

    pthread_mutex_unlock(&lqueue->lmutex);

    return value;
}

/* Destroy a queue created by dlockqueue_create(): release the underlying
 * list (if any), destroy the mutex and free the queue. NULL is ignored. */
void dlockqueue_destroy(void *q)
{
    dlockqueue *victim = q;

    if (victim != NULL) {
        if (victim->l != NULL) {
            dlistRelease(victim->l);
        }

        pthread_mutex_destroy(&victim->lmutex);
        dfree(victim);
    }
}

/* Return the number of queued elements, read under the queue mutex.
 * Returns -1 when 'q' is NULL or has no underlying list. */
long long dlockqueue_length(void *q)
{
    dlockqueue *lqueue = q;
    long long count;

    if (lqueue != NULL && lqueue->l != NULL) {
        pthread_mutex_lock(&lqueue->lmutex);
        count = dlistLength(lqueue->l);
        pthread_mutex_unlock(&lqueue->lmutex);
        return count;
    }

    return -1;
}


================================================
FILE: dep/dlist/dlockqueue.h
================================================
#ifndef _DLOCKQUEUE_H_
#define _DLOCKQUEUE_H_

struct dlist;

/* A dlist guarded by a mutex.
 * NOTE: this header uses pthread_mutex_t without including <pthread.h>;
 * include <pthread.h> before this header. */
typedef struct dlockqueue{
    struct dlist *l;            /* underlying list holding the queued values */
    long long maxlen;           /* length limit; only enforced when > 0 (-1 after create) */
    int maxlen_policy;          /* one of the MAX_LENGTH_POLICY_* values */
    pthread_mutex_t lmutex;     /* protects every access to 'l' */
} dlockqueue;

dlockqueue *dlockqueue_create(void);
long long dlockqueue_push(void *q, void *value);
void *dlockqueue_pop(void *q);
void dlockqueue_destroy(void *q);
long long dlockqueue_length(void *q);

#endif


================================================
FILE: dep/dlist/dmtqueue.c
================================================
#include <stdlib.h>

#include <dmalloc.h>

#include <dlist.h>
#include <dmtqueue.h>
#include <dlockqueue.h>

/******** multi-thread safe queue interface ********/
/* Allocate an unbound queue handle. Every operation pointer and the
 * backing queue start out NULL; bind an implementation afterwards, e.g.
 * with dmtqueue_init_with_lockqueue(). Returns NULL on allocation failure. */
dmtqueue *dmtqueue_create(void)
{
    dmtqueue *handle = dalloc(sizeof(*handle));

    if (handle != NULL) {
        handle->l = NULL;
        handle->lock_push = NULL;
        handle->lock_pop = NULL;
        handle->destroy = NULL;
        handle->length = NULL;
    }

    return handle;
}

/* Destroy the handle. The backing queue is passed to the bound destroy
 * callback first, when one is set. NULL is ignored. */
void dmtqueue_destroy(dmtqueue *q)
{
    if (q != NULL) {
        if (q->destroy) {
            q->destroy(q->l);
        }
        dfree(q);
    }
}

/* Forward a push to the bound implementation.
 * Returns whatever the implementation returns, or -1 when the handle is
 * NULL or has no backing queue / push callback. */
long long dmtqueue_push(dmtqueue *q, void *value)
{
    int usable = (q != NULL && q->l != NULL && q->lock_push != NULL);

    if (!usable) {
        return -1;
    }

    return q->lock_push(q->l, value);
}

/* Forward a pop to the bound implementation.
 * Returns whatever the implementation returns, or NULL when the handle is
 * NULL or has no backing queue / pop callback. */
void *dmtqueue_pop(dmtqueue *q)
{
    int usable = (q != NULL && q->l != NULL && q->lock_pop != NULL);

    if (!usable) {
        return NULL;
    }

    return q->lock_pop(q->l);
}

/* Tell whether the queue is empty.
 * Returns 1 when the bound length callback reports a length that is not
 * positive, 0 when it reports a positive length, and -1 when the handle
 * is NULL or has no backing queue / length callback. */
int dmtqueue_empty(dmtqueue *q)
{
    int usable = (q != NULL && q->l != NULL && q->length != NULL);

    if (!usable) {
        return -1;
    }

    return (q->length(q->l) > 0) ? 0 : 1;
}

/* Forward a length query to the bound implementation.
 * Returns -1 when the handle is NULL or has no backing queue / length
 * callback. */
long long dmtqueue_length(dmtqueue *q)
{
    int usable = (q != NULL && q->l != NULL && q->length != NULL);

    if (!usable) {
        return -1;
    }

    return q->length(q->l);
}

/******** multi-thread safe queue implement ********/

/**
* Bind a handle to the mutex-based dlockqueue implementation.
* This lock queue is not the fastest option, but it is safe.
*
* 'freefunc' becomes the free method of the underlying list (NULL for none).
* Returns 0 on success, -1 when 'q' is NULL or the lock queue cannot be
* created.
*/
int dmtqueue_init_with_lockqueue(dmtqueue *q, dlockqueue_freefunc freefunc)
{
    dlockqueue *backing;

    if (q == NULL) {
        return -1;
    }

    backing = dlockqueue_create();
    if (backing == NULL) {
        return -1;
    }
    backing->l->free = freefunc;

    /* Wire the handle's operations to the dlockqueue functions. */
    q->lock_push = dlockqueue_push;
    q->lock_pop = dlockqueue_pop;
    q->length = dlockqueue_length;
    q->destroy = dlockqueue_destroy;
    q->l = backing;

    return 0;
}


================================================
FILE: dep/dlist/dmtqueue.h
================================================
#ifndef _DMTQUEUE_H_
#define _DMTQUEUE_H_

/* What a push does when the queue has reached its maximum length. */
#define MAX_LENGTH_POLICY_REJECT        0   /* refuse the new value */
#define MAX_LENGTH_POLICY_EVICT_HEAD    1   /* delete from the head to make room */
#define MAX_LENGTH_POLICY_EVICT_END     2   /* delete from the tail to make room */

/* Multi-thread safe queue.
 * A thin handle: 'l' is the backing queue object and the function pointers
 * are the operations of whichever implementation was bound to it. All of
 * them are NULL until an init function such as
 * dmtqueue_init_with_lockqueue() has been called. */
typedef struct dmtqueue{
    void *l;                                        /* backing queue, passed as 'q' to the callbacks */
    long long (*lock_push)(void *q, void *value);   /* append a value */
    void *(*lock_pop)(void *q);                     /* remove and return a value */
    void (*destroy)(void *q);                       /* destroy the backing queue */
    long long (*length)(void *q);                   /* number of queued values */
} dmtqueue;

/* Configure the length limit / overflow policy of a queue that was bound
 * with dmtqueue_init_with_lockqueue(). 'q' is a dmtqueue pointer whose
 * backing object is a dlockqueue, so dlockqueue.h must be included where
 * these macros are used. The second parameter is deliberately not named
 * 'l': that would also replace the member name in (q)->l. */
#define dmtqueueSetMaxlength(q,len)      (((dlockqueue *)(q)->l)->maxlen = (len))
#define dmtqueueSetMaxlengthPolicy(q,p)  (((dlockqueue *)(q)->l)->maxlen_policy = (p))

typedef int (*dmtqueue_init)(dmtqueue *);

/******** multi-thread safe list interface ********/

dmtqueue *dmtqueue_create(void);
void dmtqueue_destroy(dmtqueue *q);
long long dmtqueue_push(dmtqueue *q, void *value);
void *dmtqueue_pop(dmtqueue *q);
int dmtqueue_empty(dmtqueue *q);
long long dmtqueue_length(dmtqueue *q);

/******** multi-thread safe list implement ********/

typedef void (*dlockqueue_freefunc)(void *);
int dmtqueue_init_with_lockqueue(dmtqueue *l, dlockqueue_freefunc freefunc);

#endif


================================================
FILE: dep/dmalloc/Makefile.am
================================================
MAINTAINERCLEANFILES = Makefile.in

AM_CPPFLAGS =
if !OS_SOLARIS
AM_CPPFLAGS += -D_GNU_SOURCE
endif
AM_CPPFLAGS += -I $(top_srcdir)/dep/jemalloc-4.2.0/include
AM_CPPFLAGS += -I $(top_srcdir)/dep/util

AM_CFLAGS = -Wall -Wshadow
AM_CFLAGS += -Wno-unused-parameter -Wno-unused-value

noinst_LIBRARIES = libdmalloc.a

noinst_HEADERS = dmalloc.h

libdmalloc_a_SOURCES =      \
	dmalloc.c dmalloc.h

================================================
FILE: dep/dmalloc/dmalloc.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <errno.h>
#include <pthread.h>

#include <unistd.h>

#include <dutil.h>
#include <dlog.h>

#include <dmalloc.h>

/*memory api*/
static size_t used_memory = 0;
pthread_mutex_t used_memory_mutex = PTHREAD_MUTEX_INITIALIZER;

/* used_memory is updated with the cheapest primitive available: compiler
 * __atomic builtins, then __sync builtins, then the mutex above.
 * malloc_lock_type() returns the name of the variant compiled in. */
#if defined(__ATOMIC_RELAXED)
#define update_used_mem_stat_add(__n) __atomic_add_fetch(&used_memory, (__n), __ATOMIC_RELAXED)
#define update_used_mem_stat_sub(__n) __atomic_sub_fetch(&used_memory, (__n), __ATOMIC_RELAXED)
char *malloc_lock_type(void) {return "__ATOMIC_RELAXED";}
#elif defined(HAVE_ATOMIC)
#define update_used_mem_stat_add(__n) __sync_add_and_fetch(&used_memory, (__n))
#define update_used_mem_stat_sub(__n) __sync_sub_and_fetch(&used_memory, (__n))
char *malloc_lock_type(void) {return "HAVE_ATOMIC";}
#else
#define update_used_mem_stat_add(__n) do {      \
    pthread_mutex_lock(&used_memory_mutex);     \
    used_memory += (__n); \
    pthread_mutex_unlock(&used_memory_mutex);   \
} while(0)

#define update_used_mem_stat_sub(__n) do {      \
    pthread_mutex_lock(&used_memory_mutex);     \
    used_memory -= (__n); \
    pthread_mutex_unlock(&used_memory_mutex);   \
} while(0)

char *malloc_lock_type(void) {return "pthread_mutex_t";}
#endif

/* dmalloc.h declares this function under the name dmalloc_lock_type();
 * provide that name too so that callers of the declared API link. */
char *dmalloc_lock_type(void) {return malloc_lock_type();}

/* Account an allocation of __n bytes in the used-memory counter. The
 * amount is first rounded up to the next multiple of sizeof(long). */
#define update_dmalloc_stat_alloc(__n) do {                                 \
    size_t _bytes = (__n);                                                  \
    size_t _rem = _bytes & (sizeof(long)-1);                                \
    if (_rem != 0) _bytes += sizeof(long) - _rem;                           \
    update_used_mem_stat_add(_bytes);                                       \
} while(0)

/* Account the release of __n bytes, using the same rounding as above. */
#define update_dmalloc_stat_free(__n) do {                                  \
    size_t _bytes = (__n);                                                  \
    size_t _rem = _bytes & (sizeof(long)-1);                                \
    if (_rem != 0) _bytes += sizeof(long) - _rem;                           \
    update_used_mem_stat_sub(_bytes);                                       \
} while(0)

/* Size of the header stored in front of every allocation. It is zero when
 * the allocator can report block sizes itself (HAVE_MALLOC_SIZE). */
#ifdef HAVE_MALLOC_SIZE
#define PREFIX_SIZE (0)
#else
#if defined(__sun) || defined(__sparc) || defined(__sparc__)
#define PREFIX_SIZE (sizeof(long long))
#else
#define PREFIX_SIZE (sizeof(size_t))
#endif
#endif

/* Fallback dmalloc_size() for allocators without a size query: the
 * requested size is read back from the header that precedes 'ptr'. */
#ifndef HAVE_MALLOC_SIZE
size_t dmalloc_size(void *ptr) {
    const size_t *header = (const size_t *)((char *)ptr - PREFIX_SIZE);
    size_t payload = *header;
    size_t rem = payload & (sizeof(long) - 1);

    /* Assume the underlying allocator pads every allocation to a
     * multiple of sizeof(long). */
    if (rem != 0) {
        payload += sizeof(long) - rem;
    }
    return payload + PREFIX_SIZE;
}
#endif

/* Allocate 'size' bytes and account them in the used-memory counter.
 *
 * 'name' and 'line' identify the call site for the log messages (the
 * dalloc() macro passes __FILE__ and __LINE__). 'size' must not be 0.
 *
 * Without HAVE_MALLOC_SIZE the block is preceded by a PREFIX_SIZE header
 * that stores 'size'; the returned pointer points just past that header.
 *
 * Returns the usable pointer, or NULL when the allocation fails. */
void *
_dalloc(size_t size, const char *name, int line)
{
    void *p;

    ASSERT(size != 0);

    /* size+PREFIX_SIZE must not wrap around. */
    if (size > (size_t)-1 - PREFIX_SIZE) {
        log_error("malloc(%zu) failed @ %s:%d", size, name, line);
        return NULL;
    }

#ifdef DUSE_JEMALLOC
    p = je_malloc(size+PREFIX_SIZE);
#else
    p = malloc(size+PREFIX_SIZE);
#endif
    if (p == NULL) {
        log_error("malloc(%zu) failed @ %s:%d", size, name, line);
        return NULL;
    }

    /* Log before returning; both branches below leave the function. */
    log_debug(LOG_VVERB, "malloc(%zu) at %p @ %s:%d", size, p, name, line);

#ifdef HAVE_MALLOC_SIZE
    update_dmalloc_stat_alloc(dmalloc_size(p));
    return p;
#else
    *((size_t*)p) = size;
    update_dmalloc_stat_alloc(size+PREFIX_SIZE);
    return (char*)p+PREFIX_SIZE;
#endif
}

/* Like _dalloc(), but the returned memory is filled with zero bytes.
 * Returns NULL when the allocation fails. */
void *
_dzalloc(size_t size, const char *name, int line)
{
    void *zeroed = _dalloc(size, name, line);

    if (zeroed == NULL) {
        return NULL;
    }

    memset(zeroed, 0, size);
    return zeroed;
}

/* Allocate a zero-filled array of 'nmemb' elements of 'size' bytes each.
 * Returns NULL when nmemb*size does not fit in a size_t or the allocation
 * fails. */
void *
_dcalloc(size_t nmemb, size_t size, const char *name, int line)
{
    /* Reject element counts whose total size would wrap around. */
    if (size != 0 && nmemb > (size_t)-1 / size) {
        log_error("calloc(%zu, %zu) overflows @ %s:%d", nmemb, size, name, line);
        return NULL;
    }

    return _dzalloc(nmemb * size, name, line);
}

/* Resize the block 'ptr' to 'size' bytes and update the used-memory
 * counter. A NULL 'ptr' behaves like _dalloc(). 'size' must not be 0.
 *
 * Without HAVE_MALLOC_SIZE the pointer handed to the allocator is the
 * start of the PREFIX_SIZE header that precedes 'ptr', not 'ptr' itself,
 * and the header is rewritten with the new size.
 *
 * Returns the (possibly moved) usable pointer, or NULL on failure, in
 * which case the original block is still valid. */
void *
_drealloc(void *ptr, size_t size, const char *name, int line)
{
#ifndef HAVE_MALLOC_SIZE
    void *realp;
#endif
    void *p;
    size_t oldsize;

    ASSERT(size != 0);

    if (ptr == NULL) return _dalloc(size, name, line);

#ifdef HAVE_MALLOC_SIZE
    oldsize = dmalloc_size(ptr);
#ifdef DUSE_JEMALLOC
    p = je_realloc(ptr, size);
#else
    p = realloc(ptr, size);
#endif
#else
    realp = (char*)ptr-PREFIX_SIZE;
    oldsize = *((size_t*)realp);
#ifdef DUSE_JEMALLOC
    p = je_realloc(realp, size+PREFIX_SIZE);
#else
    p = realloc(realp, size+PREFIX_SIZE);
#endif
#endif
    if (p == NULL) {
        log_error("realloc(%zu) failed @ %s:%d", size, name, line);
        return NULL;
    }

    log_debug(LOG_VVERB, "realloc(%zu) at %p @ %s:%d", size, p, name, line);
#ifdef HAVE_MALLOC_SIZE
    update_dmalloc_stat_free(oldsize);
    update_dmalloc_stat_alloc(dmalloc_size(p));
    return p;
#else
    *((size_t*)p) = size;
    /* Account the header as well, matching _dalloc() and _dfree(). */
    update_dmalloc_stat_free(oldsize+PREFIX_SIZE);
    update_dmalloc_stat_alloc(size+PREFIX_SIZE);
    return (char*)p+PREFIX_SIZE;
#endif
}

/* Release a block obtained from _dalloc()/_dzalloc()/_dcalloc()/_drealloc()
 * and subtract it from the used-memory counter. 'ptr' must not be NULL.
 *
 * Without HAVE_MALLOC_SIZE the block really starts PREFIX_SIZE bytes
 * before 'ptr'; that address is the one returned to the allocator, and it
 * is released exactly once. */
void
_dfree(void *ptr, const char *name, int line)
{
#ifndef HAVE_MALLOC_SIZE
    void *realp;
    size_t oldsize;
#endif

    ASSERT(ptr != NULL);
    log_debug(LOG_VVERB, "free(%p) @ %s:%d", ptr, name, line);

#ifdef HAVE_MALLOC_SIZE
    update_dmalloc_stat_free(dmalloc_size(ptr));
#ifdef DUSE_JEMALLOC
    je_free(ptr);
#else
    free(ptr);
#endif
#else
    realp = (char*)ptr-PREFIX_SIZE;
    oldsize = *((size_t*)realp);
    update_dmalloc_stat_free(oldsize+PREFIX_SIZE);
#ifdef DUSE_JEMALLOC
    je_free(realp);
#else
    free(realp);
#endif
#endif
}

/* Return the current value of the used-memory counter. The read uses the
 * same mechanism as the updates: an atomic add of 0 when atomics are
 * available, otherwise a read under used_memory_mutex. */
size_t
dalloc_used_memory(void)
{
#if defined(__ATOMIC_RELAXED) || defined(HAVE_ATOMIC)
    return update_used_mem_stat_add(0);
#else
    size_t snapshot;

    pthread_mutex_lock(&used_memory_mutex);
    snapshot = used_memory;
    pthread_mutex_unlock(&used_memory_mutex);

    return snapshot;
#endif
}

/* Returns the size of physical memory (RAM) in bytes, or 0 when it cannot
 * be determined on this platform.
 * It looks ugly, but this is the cleanest way to achieve cross platform results.
 * Cleaned up from:
 *
 * http://nadeausoftware.com/articles/2012/09/c_c_tip_how_get_physical_memory_size_system
 *
 * Note that this function:
 * 1) Was released under the following CC attribution license:
 *    http://creativecommons.org/licenses/by/3.0/deed.en_US.
 * 2) Was originally implemented by David Robert Nadeau.
 * 3) Was modified for Redis by Matt Stancliff.
 * 4) This note exists in order to comply with the original license.
 */
size_t dalloc_get_memory_size(void) {
#if defined(__unix__) || defined(__unix) || defined(unix) || \
    (defined(__APPLE__) && defined(__MACH__))
#if defined(CTL_HW) && (defined(HW_MEMSIZE) || defined(HW_PHYSMEM64))
    int mib[2];
    mib[0] = CTL_HW;
#if defined(HW_MEMSIZE)
    mib[1] = HW_MEMSIZE;            /* OSX. --------------------- */
#elif defined(HW_PHYSMEM64)
    mib[1] = HW_PHYSMEM64;          /* NetBSD, OpenBSD. --------- */
#endif
    int64_t size = 0;               /* 64-bit */
    size_t len = sizeof(size);
    if (sysctl( mib, 2, &size, &len, NULL, 0) == 0)
        return (size_t)size;
    return 0L;          /* Failed? */

#elif defined(_SC_PHYS_PAGES) && defined(_SC_PAGESIZE)
    /* FreeBSD, Linux, OpenBSD, and Solaris. -------------------- */
    return (size_t)sysconf(_SC_PHYS_PAGES) * (size_t)sysconf(_SC_PAGESIZE);

#elif defined(CTL_HW) && (defined(HW_PHYSMEM) || defined(HW_REALMEM))
    /* DragonFly BSD, FreeBSD, NetBSD, OpenBSD, and OSX. -------- */
    int mib[2];
    mib[0] = CTL_HW;
#if defined(HW_REALMEM)
    mib[1] = HW_REALMEM;        /* FreeBSD. ----------------- */
#elif defined(HW_PHYSMEM)
    /* The test must name HW_PHYSMEM exactly, otherwise mib[1] is left
     * uninitialised on systems that only provide HW_PHYSMEM. */
    mib[1] = HW_PHYSMEM;        /* Others. ------------------ */
#endif
    unsigned int size = 0;      /* 32-bit */
    size_t len = sizeof(size);
    if (sysctl(mib, 2, &size, &len, NULL, 0) == 0)
        return (size_t)size;
    return 0L;          /* Failed? */
#endif /* sysctl and sysconf variants */

#else
    return 0L;          /* Unknown OS. */
#endif
}

/* Get the RSS information in an OS-specific way.
 *
 * WARNING: the function dalloc_get_rss() is not designed to be fast
 * and must not be called in the busy loops where the server tries to
 * release memory by expiring or swapping out objects.
 *
 * For this kind of "fast RSS reporting" usage, use instead the
 * function RedisEstimateRSS(), which is a much faster (and less precise)
 * version of this function. */

#if defined(HAVE_PROC_STAT)
#include <unistd.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>

/* Resident set size of this process in bytes, read from /proc/<pid>/stat.
 * Returns 0 when the file cannot be opened, read or parsed. */
size_t dalloc_get_rss(void) {
    int page = sysconf(_SC_PAGESIZE);
    size_t rss;
    char buf[4096];
    char filename[256];
    int fd, count;
    ssize_t nread;
    char *p, *x;

    snprintf(filename,sizeof(filename),"/proc/%d/stat",(int)getpid());
    if ((fd = open(filename,O_RDONLY)) == -1) return 0;
    /* Leave room for the terminator: the strchr() calls below need a
     * NUL-terminated string and read() does not add one. */
    nread = read(fd,buf,sizeof(buf)-1);
    close(fd);
    if (nread <= 0) return 0;
    buf[nread] = '\0';

    p = buf;
    count = 23; /* RSS is the 24th field in /proc/<pid>/stat */
    while(p && count--) {
        p = strchr(p,' ');
        if (p) p++;
    }
    if (!p) return 0;
    x = strchr(p,' ');
    if (!x) return 0;
    *x = '\0';

    /* The field counts pages; convert to bytes. */
    rss = strtoll(p,NULL,10);
    rss *= page;
    return rss;
}
#elif defined(HAVE_TASKINFO)
#include <unistd.h>
#include <stdio.h>
#include <stdlib.h>
#include <sys/types.h>
#include <sys/sysctl.h>
#include <mach/task.h>
#include <mach/mach_init.h>

/* Resident set size of this process in bytes, obtained from the Mach
 * task_info() interface. Returns 0 when the task port or the task
 * information cannot be obtained. */
size_t dalloc_get_rss(void) {
    task_t task = MACH_PORT_NULL;
    struct task_basic_info t_info;
    mach_msg_type_number_t t_info_count = TASK_BASIC_INFO_COUNT;

    if (task_for_pid(current_task(), getpid(), &task) != KERN_SUCCESS)
        return 0;
    /* t_info is only filled in on success; don't read it otherwise. */
    if (task_info(task, TASK_BASIC_INFO, (task_info_t)&t_info, &t_info_count)
        != KERN_SUCCESS)
        return 0;

    return t_info.resident_size;
}
#else
/* Fallback for systems without an OS-specific way to read the RSS: report
 * the memory usage tracked by the allocation wrappers instead.
 *
 * Fragmentation will appear to be always 1 (no fragmentation)
 * of course... */
size_t dalloc_get_rss(void) {
    size_t estimate = dalloc_used_memory();

    return estimate;
}
#endif

/* Fragmentation = RSS / allocated-bytes, where allocated-bytes is the
 * current value of the used-memory counter. */
float dalloc_get_fragmentation_ratio(size_t rss) {
    size_t allocated = dalloc_used_memory();

    return (float)rss/allocated;
}


================================================
FILE: dep/dmalloc/dmalloc.h
================================================
#ifndef _DMALLOC_H_
#define _DMALLOC_H_

#ifdef HAVE_CONFIG_H
# include <config.h>
#endif

#include <dspecialconfig.h>

#ifdef HAVE_JEMALLOC
# define DUSE_JEMALLOC 1
#endif

/*
 * Memory allocation and free wrappers.
 *
 * These wrappers enable us to loosely detect double frees, dangling
 * pointer accesses and zero-byte allocations.
 */
#if defined(DUSE_JEMALLOC)
#define DMALLOC_LIB ("jemalloc-" __xstr(JEMALLOC_VERSION_MAJOR) "." __xstr(JEMALLOC_VERSION_MINOR) "." __xstr(JEMALLOC_VERSION_BUGFIX))
#include <jemalloc/jemalloc.h>
#if (JEMALLOC_VERSION_MAJOR == 2 && JEMALLOC_VERSION_MINOR >= 1) || (JEMALLOC_VERSION_MAJOR > 2)
#define HAVE_MALLOC_SIZE 1
#define dmalloc_size(p) je_malloc_usable_size(p)
#else
#error "Newer version of jemalloc required"
#endif
#elif defined(__APPLE__)
#include <malloc/malloc.h>
#define HAVE_MALLOC_SIZE 1
#define dmalloc_size(p) malloc_size(p)
#endif
    
#ifndef DMALLOC_LIB
#define DMALLOC_LIB "libc"
#endif

/* Allocation entry points. Each macro forwards to the matching
 * underscore-prefixed function and adds the call site (__FILE__ and
 * __LINE__), which the functions use in their log messages. Size
 * arguments are converted to size_t. */

/* Allocate _s bytes (uninitialised). */
#define dalloc(_s)                    \
    _dalloc((size_t)(_s), __FILE__, __LINE__)

/* Allocate _s zero-filled bytes. */
#define dzalloc(_s)                   \
    _dzalloc((size_t)(_s), __FILE__, __LINE__)

/* Allocate a zero-filled array of _n elements of _s bytes each. */
#define dcalloc(_n, _s)               \
    _dcalloc((size_t)(_n), (size_t)(_s), __FILE__, __LINE__)

/* Resize block _p to _s bytes; a NULL _p allocates a new block. */
#define drealloc(_p, _s)              \
    _drealloc(_p, (size_t)(_s), __FILE__, __LINE__)

/* Release block _p. _dfree() asserts that the pointer is not NULL. */
#define dfree(_p) do {                \
    _dfree(_p, __FILE__, __LINE__);   \
} while (0)

char *dmalloc_lock_type(void);

#ifndef HAVE_MALLOC_SIZE
size_t dmalloc_size(void *ptr);
#endif

void *_dalloc(size_t size, const char *name, int line);
void *_dzalloc(size_t size, const char *name, int line);
void *_dcalloc(size_t nmemb, size_t size, const char *name, int line);
void *_drealloc(void *ptr, size_t size, const char *name, int line);
void _dfree(void *ptr, const char *name, int line);

size_t dalloc_used_memory(void);

size_t dalloc_get_memory_size(void);

size_t dalloc_get_rss(void);
float dalloc_get_fragmentation_ratio(size_t rss);

#endif


================================================
FILE: dep/himemcached-0.1.0/Makefile.am
================================================
MAINTAINERCLEANFILES = Makefile.in

AM_CFLAGS = -Wall -Wshadow
AM_CFLAGS += -Wno-unused-parameter -Wno-unused-value

noinst_LIBRARIES = libhimemcached.a

noinst_HEADERS = himemcached.h himcread.h himcdep/sds.h

libhimemcached_a_SOURCES =          \
    himcdep/sds.c himcdep/sds.h     \
    himcread.c himcread.h           \
	himemcached.c himemcached.h

================================================
FILE: dep/himemcached-0.1.0/himcdep/sds.c
================================================
/* SDS (Simple Dynamic Strings), A C dynamic strings library.
 *
 * Copyright (c) 2006-2014, Salvatore Sanfilippo <antirez at gmail dot com>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *   * Redistributions of source code must retain the above copyright notice,
 *     this list of conditions and the following disclaimer.
 *   * Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *   * Neither the name of Redis nor the names of its contributors may be used
 *     to endorse or promote products derived from this software without
 *     specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <ctype.h>
#include <assert.h>

#include "sds.h"

/* Allocate a new sds string holding 'initlen' bytes copied from 'init'.
 *
 * When 'init' is NULL the allocation is zero-filled instead, producing a
 * string made of 'initlen' zero bytes.
 *
 * A terminating '\0' is always stored right after the payload, so a string
 * created with:
 *
 * mystring = sdsnewlen("abc",3);
 *
 * can be passed straight to printf(). The content is still binary safe:
 * the length is kept in the header that precedes the returned pointer, so
 * '\0' bytes in the middle of the string are allowed.
 *
 * Returns NULL when the allocation fails. */
sds sdsnewlen(const void *init, size_t initlen) {
    const size_t total = sizeof(struct sdshdr)+initlen+1;
    struct sdshdr *hdr = init ? malloc(total) : calloc(total,1);

    if (hdr == NULL) return NULL;
    hdr->len = initlen;
    hdr->free = 0;
    if (init && initlen)
        memcpy(hdr->buf, init, initlen);
    hdr->buf[initlen] = '\0';
    return (char*)hdr->buf;
}

/* Return a freshly allocated sds string of length zero. The result still
 * carries the implicit terminating '\0'. */
sds sdsempty(void) {
    const char *nothing = "";

    return sdsnewlen(nothing,0);
}

/* Build a new sds string from the null-terminated C string 'init'.
 * A NULL 'init' yields an empty string. */
sds sdsnew(const char *init) {
    if (init == NULL) return sdsnewlen(NULL, 0);
    return sdsnewlen(init, strlen(init));
}

/* Return a newly allocated copy of the sds string 's'. */
sds sdsdup(const sds s) {
    size_t nbytes = sdslen(s);

    return sdsnewlen(s, nbytes);
}

/* Release an sds string. Passing NULL is allowed and does nothing.
 * The allocation starts at the header that sits just before 's'. */
void sdsfree(sds s) {
    if (s != NULL)
        free(s-sizeof(struct sdshdr));
}

/* Recompute the stored length of 's' with strlen(), i.e. treat everything
 * after the first '\0' byte as unused space.
 *
 * Useful after the buffer has been edited by hand, for example:
 *
 * s = sdsnew("foobar");
 * s[2] = '\0';
 * sdsupdatelen(s);
 *
 * After the call sdslen(s) is 2. Without the call it would still be 6,
 * because the header was not told about the manual truncation. The bytes
 * given up are accounted as free space. */
void sdsupdatelen(sds s) {
    struct sdshdr *hdr = (void*) (s-sizeof *hdr);
    int visible = strlen(s);

    hdr->free += (hdr->len-visible);
    hdr->len = visible;
}

/* Empty the sds string in place. Nothing is deallocated: the bytes that
 * held the old content are added to the free space, so later appends up to
 * that size need no reallocation. */
void sdsclear(sds s) {
    struct sdshdr *hdr = (void*) (s-sizeof *hdr);

    hdr->buf[0] = '\0';
    hdr->free += hdr->len;
    hdr->len = 0;
}

/* Guarantee that at least 'addlen' bytes (plus the terminating '\0') can be
 * written after the current end of 's'.
 *
 * If the existing free space is already sufficient, 's' is returned as is.
 * Otherwise the buffer is reallocated with extra headroom: the required
 * size is doubled while it is below SDS_MAX_PREALLOC, and grown by
 * SDS_MAX_PREALLOC beyond that.
 *
 * The length reported by sdslen() is not changed, only the free space.
 * Returns NULL if the reallocation fails; in that case the original string
 * is left untouched. */
sds sdsMakeRoomFor(sds s, size_t addlen) {
    struct sdshdr *oldhdr, *grown;
    size_t curlen, target;

    if (sdsavail(s) >= addlen) return s;

    curlen = sdslen(s);
    oldhdr = (void*) (s-sizeof *oldhdr);
    target = (curlen+addlen);
    target = (target < SDS_MAX_PREALLOC) ? target*2 : target+SDS_MAX_PREALLOC;

    grown = realloc(oldhdr, sizeof *grown+target+1);
    if (grown == NULL) return NULL;

    grown->free = target - curlen;
    return grown->buf;
}

/* Shrink the allocation of 's' so that no free space is left after the
 * content. The content itself is not modified, but the next append will
 * need a reallocation.
 *
 * After the call the pointer passed in must be considered invalid; use the
 * returned pointer instead.
 *
 * If the reallocation fails the original allocation is still intact, so
 * the string is returned unchanged (free space included) instead of
 * dereferencing a NULL header. */
sds sdsRemoveFreeSpace(sds s) {
    struct sdshdr *sh = (void*) (s-sizeof *sh);
    struct sdshdr *shrunk;

    shrunk = realloc(sh, sizeof *sh+sh->len+1);
    if (shrunk == NULL) return s; /* old block untouched by a failed realloc */
    shrunk->free = 0;
    return shrunk->buf;
}

/* Report how many bytes the allocation behind 's' occupies. The total is
 * the sum of:
 * 1) the sds header located before the pointer,
 * 2) the string content,
 * 3) the unused space after the content, if any,
 * 4) the implicit terminating '\0'.
 */
size_t sdsAllocSize(sds s) {
    struct sdshdr *hdr = (void*) (s-sizeof *hdr);

    return sizeof(*hdr)+hdr->len+hdr->free+1;
}

/* Move 'incr' bytes from the free space into the string length and place
 * the terminating '\0' at the new end of the string.
 *
 * The intended use is to fix up the length after calling sdsMakeRoomFor()
 * and writing directly past the old end of the string.
 *
 * A negative 'incr' right-trims the string.
 *
 * Typical pattern, appending data read from a descriptor without going
 * through an intermediate buffer:
 *
 * oldlen = sdslen(s);
 * s = sdsMakeRoomFor(s, BUFFER_SIZE);
 * nread = read(fd, s+oldlen, BUFFER_SIZE);
 * ... check for nread <= 0 and handle it ...
 * sdsIncrLen(s, nread);
 *
 * The asserts verify that the free space is large enough for 'incr'.
 */
void sdsIncrLen(sds s, int incr) {
    struct sdshdr *hdr = (void*) (s-sizeof *hdr);

    assert(hdr->free >= incr);
    hdr->free -= incr;
    hdr->len += incr;
    assert(hdr->free >= 0);
    s[hdr->len] = '\0';
}

/* Extend 's' to exactly 'len' bytes, filling the newly exposed bytes with
 * zeros.
 *
 * When 'len' is not larger than the current length nothing happens and 's'
 * is returned unchanged. Returns NULL if more room could not be obtained. */
sds sdsgrowzero(sds s, size_t len) {
    struct sdshdr *hdr = (void*) (s-sizeof *hdr);
    size_t oldlen = hdr->len, capacity;

    if (len <= oldlen) return s;

    s = sdsMakeRoomFor(s,len-oldlen);
    if (s == NULL) return NULL;

    /* The buffer may have moved: locate the header again. */
    hdr = (void*)(s-sizeof *hdr);
    /* Zero the added region, including the terminating '\0' byte. */
    memset(s+oldlen,0,(len-oldlen+1));
    capacity = hdr->len+hdr->free;
    hdr->len = len;
    hdr->free = capacity-hdr->len;
    return s;
}

/* Append 'len' bytes starting at 't' to the sds string 's'. The data is
 * treated as binary: it may contain '\0' bytes.
 *
 * The pointer passed in must be considered invalid afterwards; use the
 * returned pointer instead. Returns NULL if room could not be obtained. */
sds sdscatlen(sds s, const void *t, size_t len) {
    const size_t oldlen = sdslen(s);
    struct sdshdr *hdr;

    s = sdsMakeRoomFor(s,len);
    if (s == NULL) return NULL;

    memcpy(s+oldlen, t, len);
    s[oldlen+len] = '\0';

    hdr = (void*) (s-sizeof *hdr);
    hdr->len = oldlen+len;
    hdr->free = hdr->free-len;
    return s;
}

/* Append the null-terminated C string 't' to the sds string 's'.
 *
 * The pointer passed in must be considered invalid afterwards; use the
 * returned pointer instead. */
sds sdscat(sds s, const char *t) {
    size_t tlen = strlen(t);

    return sdscatlen(s, t, tlen);
}

/* Append the sds string 't' to the sds string 's'.
 *
 * The pointer passed in as 's' must be considered invalid afterwards; use
 * the returned pointer instead. */
sds sdscatsds(sds s, const sds t) {
    size_t tlen = sdslen(t);

    return sdscatlen(s, t, tlen);
}

/* Overwrite the content of 's' with the 'len' bytes found at 't' (binary
 * safe). The buffer is enlarged first when its current capacity is too
 * small. Returns NULL if enlarging fails. */
sds sdscpylen(sds s, const char *t, size_t len) {
    struct sdshdr *hdr = (void*) (s-sizeof *hdr);
    size_t capacity = hdr->free+hdr->len;

    if (capacity < len) {
        s = sdsMakeRoomFor(s,len-hdr->len);
        if (s == NULL) return NULL;
        /* The buffer may have moved: refresh header and capacity. */
        hdr = (void*) (s-sizeof *hdr);
        capacity = hdr->free+hdr->len;
    }
    memcpy(s, t, len);
    s[len] = '\0';
    hdr->len = len;
    hdr->free = capacity-len;
    return s;
}

/* Same as sdscpylen(), with the length of the null-terminated string 't'
 * measured by strlen(). */
sds sdscpy(sds s, const char *t) {
    size_t tlen = strlen(t);

    return sdscpylen(s, t, tlen);
}

/* Helper doing the actual number -> string conversion for signed values.
 * 's' must point to a buffer with room for at least SDS_LLSTR_SIZE bytes
 * (20 characters for the longest value, "-9223372036854775808", plus the
 * terminating '\0').
 *
 * The function returns the length of the null-terminated string
 * representation stored at 's'. */
#define SDS_LLSTR_SIZE 21
int sdsll2str(char *s, long long value) {
    char *p, aux;
    unsigned long long v;
    size_t l;

    /* Take the magnitude using unsigned arithmetic: negating the most
     * negative long long as a signed value overflows (undefined behaviour),
     * while the unsigned negation is well defined and gives the right
     * result. */
    v = (value < 0) ? 0ULL-(unsigned long long)value
                    : (unsigned long long)value;

    /* Generate the digits, least significant first, which produces a
     * reversed string. */
    p = s;
    do {
        *p++ = '0'+(v%10);
        v /= 10;
    } while(v);
    if (value < 0) *p++ = '-';

    /* Compute length and add null term. */
    l = p-s;
    *p = '\0';

    /* Reverse the string. */
    p--;
    while(s < p) {
        aux = *s;
        *s = *p;
        *p = aux;
        s++;
        p--;
    }
    return l;
}

/* Unsigned counterpart of sdsll2str(): writes the decimal representation
 * of 'v' at 's', null-terminated, and returns its length. */
int sdsull2str(char *s, unsigned long long v) {
    char *head = s, *tail = s;
    size_t digits;

    /* Emit the digits least significant first. */
    do {
        *tail++ = '0'+(v%10);
        v /= 10;
    } while(v);

    /* Record the length, terminate, and step back onto the last digit. */
    digits = tail-head;
    *tail-- = '\0';

    /* Swap from both ends towards the middle to restore digit order. */
    for (; head < tail; head++, tail--) {
        char tmp = *head;

        *head = *tail;
        *tail = tmp;
    }
    return digits;
}

/* Like sdscatprintf() but takes a va_list instead of being variadic.
 *
 * The formatted text is produced in a temporary heap buffer that starts at
 * 16 bytes and is doubled until the output fits; it is then appended to
 * 's'. Returns NULL if the temporary buffer cannot be allocated or the
 * append fails. */
sds sdscatvprintf(sds s, const char *fmt, va_list ap) {
    va_list cpy;
    char *buf, *t;
    size_t buflen = 16;

    while(1) {
        buf = malloc(buflen);
        if (buf == NULL) return NULL;
        /* Sentinel: if vsnprintf() overwrites this byte with something
         * other than '\0', the output did not fit in the buffer. */
        buf[buflen-2] = '\0';
        va_copy(cpy,ap);
        vsnprintf(buf, buflen, fmt, cpy);
        /* Every va_copy() must be paired with a va_end(). */
        va_end(cpy);
        if (buf[buflen-2] != '\0') {
            free(buf);
            buflen *= 2;
            continue;
        }
        break;
    }
    t = sdscat(s, buf);
    free(buf);
    return t;
}

/* Append to 's' the text produced by a printf-style format and arguments.
 *
 * The pointer passed in must be considered invalid afterwards; use the
 * returned pointer instead.
 *
 * Example:
 *
 * s = sdsnew("Sum is: ");
 * s = sdscatprintf(s,"%d+%d = %d",a,b,a+b);
 *
 * To build a string from scratch, start from an empty one:
 *
 * s = sdscatprintf(sdsempty(), "... your format ...", args);
 */
sds sdscatprintf(sds s, const char *fmt, ...) {
    va_list args;
    sds result;

    va_start(args, fmt);
    result = sdscatvprintf(s,fmt,args);
    va_end(args);
    return result;
}

/* This function is similar to sdscatprintf(), but does not go through the
 * libc printf family: the output is written directly into the sds buffer
 * as each piece of the format is processed.
 *
 * Only the following, printf-incompatible, set of specifiers is handled:
 *
 * %s - C String
 * %S - SDS string
 * %i - signed int
 * %I - 64 bit signed integer (long long, int64_t)
 * %u - unsigned int
 * %U - 64 bit unsigned integer (unsigned long long, uint64_t)
 * %T - A size_t variable.
 * %% - Verbatim "%" character.
 *
 * Any other character following '%' is copied verbatim. A lone '%' at the
 * very end of the format is ignored.
 *
 * Returns the (possibly moved) string, or NULL if the buffer could not be
 * enlarged. On failure the string passed in is still allocated and holds,
 * null-terminated, whatever had been appended up to that point.
 */
sds sdscatfmt(sds s, char const *fmt, ...) {
    struct sdshdr *sh = (void*) (s-(sizeof(struct sdshdr)));
    size_t initlen = sdslen(s);
    const char *f = fmt;    /* Next format specifier byte to process. */
    int i;
    va_list ap;

    va_start(ap,fmt);
    i = initlen; /* Position of the next byte to write to dest str. */
    while(*f) {
        char next, *str;
        sds grown;
        int l;
        long long num;
        unsigned long long unum;

        /* Make sure there is always space for at least 1 char. */
        if (sh->free == 0) {
            grown = sdsMakeRoomFor(s,1);
            if (grown == NULL) goto oom;
            s = grown;
            sh = (void*) (s-(sizeof(struct sdshdr)));
        }

        switch(*f) {
        case '%':
            next = *(f+1);
            /* A trailing '%' has no specifier: stop here so that 'f' is
             * never advanced past the terminator of the format. */
            if (next == '\0') break;
            f++;
            switch(next) {
            case 's':
            case 'S':
                str = va_arg(ap,char*);
                l = (next == 's') ? strlen(str) : sdslen(str);
                if (sh->free < l) {
                    grown = sdsMakeRoomFor(s,l);
                    if (grown == NULL) goto oom;
                    s = grown;
                    sh = (void*) (s-(sizeof(struct sdshdr)));
                }
                memcpy(s+i,str,l);
                sh->len += l;
                sh->free -= l;
                i += l;
                break;
            case 'i':
            case 'I':
                if (next == 'i')
                    num = va_arg(ap,int);
                else
                    num = va_arg(ap,long long);
                {
                    char buf[SDS_LLSTR_SIZE];
                    l = sdsll2str(buf,num);
                    if (sh->free < l) {
                        grown = sdsMakeRoomFor(s,l);
                        if (grown == NULL) goto oom;
                        s = grown;
                        sh = (void*) (s-(sizeof(struct sdshdr)));
                    }
                    memcpy(s+i,buf,l);
                    sh->len += l;
                    sh->free -= l;
                    i += l;
                }
                break;
            case 'u':
            case 'U':
            case 'T':
                if (next == 'u')
                    unum = va_arg(ap,unsigned int);
                else if(next == 'U')
                    unum = va_arg(ap,unsigned long long);
                else
                    unum = (unsigned long long)va_arg(ap,size_t);
                {
                    char buf[SDS_LLSTR_SIZE];
                    l = sdsull2str(buf,unum);
                    if (sh->free < l) {
                        grown = sdsMakeRoomFor(s,l);
                        if (grown == NULL) goto oom;
                        s = grown;
                        sh = (void*) (s-(sizeof(struct sdshdr)));
                    }
                    memcpy(s+i,buf,l);
                    sh->len += l;
                    sh->free -= l;
                    i += l;
                }
                break;
            default: /* Handle %% and generally %<unknown>. */
                s[i++] = next;
                sh->len += 1;
                sh->free -= 1;
                break;
            }
            break;
        default:
            s[i++] = *f;
            sh->len += 1;
            sh->free -= 1;
            break;
        }
        f++;
    }
    va_end(ap);

    /* Add null-term */
    s[i] = '\0';
    return s;

oom:
    /* A failed sdsMakeRoomFor() leaves the old buffer in place, and the
     * byte at index 'len' always exists (it is the slot reserved for the
     * terminator), so the partial result can be kept well formed. */
    s[i] = '\0';
    va_end(ap);
    return NULL;
}


/* Strip from both ends of 's' every leading and trailing character that
 * appears in 'cset', a null-terminated C string.
 *
 * The string is modified in place and keeps its allocation; the removed
 * bytes are accounted as free space.
 *
 * Example:
 *
 * s = sdsnew("AA...AA.a.aa.aHelloWorld     :::");
 * sdstrim(s,"Aa. :");
 * printf("%s\n", s);
 *
 * Output will be just "HelloWorld".
 */
void sdstrim(sds s, const char *cset) {
    struct sdshdr *hdr = (void*) (s-sizeof *hdr);
    char *first = s;
    char *last = s+sdslen(s)-1;
    char *left = first, *right = last;
    size_t kept;

    /* Walk inwards from each side while the character is in the set. */
    while(left <= last && strchr(cset, *left)) left++;
    while(right > first && strchr(cset, *right)) right--;

    kept = (left > right) ? 0 : ((right-left)+1);
    if (hdr->buf != left) memmove(hdr->buf, left, kept);
    hdr->buf[kept] = '\0';
    hdr->free = hdr->free+(hdr->len-kept);
    hdr->len = kept;
}

/* Reduce 's' in place to the substring delimited by the indexes 'start'
 * and 'end', both inclusive.
 *
 * Negative indexes count from the end of the string: -1 is the last
 * character, -2 the one before it, and so on. Indexes beyond the string
 * are clamped; an empty range produces an empty string.
 *
 * Example:
 *
 * s = sdsnew("Hello World");
 * sdsrange(s,1,-1); => "ello World"
 */
void sdsrange(sds s, int start, int end) {
    struct sdshdr *hdr = (void*) (s-sizeof *hdr);
    size_t keep, curlen = sdslen(s);

    if (curlen == 0) return;

    /* Translate negative indexes, clamping at the first character. */
    if (start < 0) {
        start = curlen+start;
        if (start < 0) start = 0;
    }
    if (end < 0) {
        end = curlen+end;
        if (end < 0) end = 0;
    }

    keep = (start > end) ? 0 : (end-start)+1;
    if (keep == 0) {
        start = 0;
    } else if (start >= (signed)curlen) {
        /* The range begins past the end of the string. */
        keep = 0;
    } else if (end >= (signed)curlen) {
        /* The range ends past the end of the string: clamp it. */
        end = curlen-1;
        keep = (start > end) ? 0 : (end-start)+1;
    }

    if (start && keep) memmove(hdr->buf, hdr->buf+start, keep);
    hdr->buf[keep] = 0;
    hdr->free = hdr->free+(hdr->len-keep);
    hdr->len = keep;
}

/* Apply tolower() to every byte of the sds string 's', in place.
 *
 * Each byte is converted to unsigned char before the call: passing a
 * negative plain char to tolower() is undefined behaviour. */
void sdstolower(sds s) {
    int len = sdslen(s), j;

    for (j = 0; j < len; j++) s[j] = tolower((unsigned char)s[j]);
}

/* Apply toupper() to every byte of the sds string 's', in place.
 *
 * Each byte is converted to unsigned char before the call: passing a
 * negative plain char to toupper() is undefined behaviour. */
void sdstoupper(sds s) {
    int len = sdslen(s), j;

    for (j = 0; j < len; j++) s[j] = toupper((unsigned char)s[j]);
}

/* Compare two sds strings s1 and s2 with memcmp().
 *
 * Return value:
 *
 *     positive if s1 > s2.
 *     negative if s1 < s2.
 *     0 if s1 and s2 are exactly the same binary string.
 *
 * If the two strings are equal over the length of the shorter one, the
 * longer string is considered greater; in that case the result is exactly
 * 1 or -1. The lengths are compared explicitly rather than subtracted, so
 * the result never depends on narrowing a size_t difference to int. */
int sdscmp(const sds s1, const sds s2) {
    size_t l1, l2, minlen;
    int cmp;

    l1 = sdslen(s1);
    l2 = sdslen(s2);
    minlen = (l1 < l2) ? l1 : l2;
    cmp = memcmp(s1,s2,minlen);
    if (cmp != 0) return cmp;
    if (l1 > l2) return 1;
    if (l1 < l2) return -1;
    return 0;
}

/* Split 's' with separator in 'sep'. An array
 * of sds strings is returned. *count will be set
 * by reference to the number of tokens returned.
 *
 * On out of memory, zero length string, zero length
 * separator, NULL is returned.
 *
 * Note that 'sep' is able to split a string using
 * a multi-character separator. For example
 * sdssplit("foo_-_bar","_-_"); will return two
 * elements "foo" and "bar".
 *
 * This version of the function is binary-safe but
 * requires length arguments. sdssplit() is just the
 * same function but for zero-terminated strings.
 */
sds *sdssplitlen(const char *s, int len, const char *sep, int seplen, int *count) {
    int elements = 0, slots = 5, start = 0, j;
    sds *tokens;

    if (seplen < 1 || len < 0) return NULL;

    tokens = malloc(sizeof(sds)*slots);
    if (tokens == NULL) return NULL;

    if (len == 0) {
        *count = 0;
        return tokens;
    }
    for (j = 0; j < (len-(seplen-1)); j++) {
        /* make sure there is room for the next element and the final one */
        if (slots < elements+2) {
            sds *newtokens;

            slots *= 2;
            newtokens = realloc(tokens,sizeof(sds)*slots);
            if (newtokens == NULL) goto cleanup;
            tokens = newtokens;
        }
        /* search the separator */
        if ((seplen == 1 && *(s+j) == sep[0]) || (memcmp(s+j,sep,seplen) == 0)) {
            tokens[elements] = sdsnewlen(s+start,j-start);
            if (tokens[elements] == NULL) goto cleanup;
            elements++;
            start = j+seplen;
            j = j+seplen-1; /* skip the separator */
        }
    }
    /* Add the final element. We are sure there is room in the tokens array. */
    tokens[elements] = sdsnewlen(s+start,len-start);
    if (tokens[elements] == NULL) goto cleanup;
    elements++;
    *count = elements;
    return tokens;

cleanup:
    {
        int i;
        for (i = 0; i < elements; i++) sdsfree(tokens[i]);
        free(tokens);
        *count = 0;
        return NULL;
    }
}

/* Release an array of 'count' sds strings as returned by sdssplitlen(),
 * together with the array itself. A NULL 'tokens' is ignored. */
void sdsfreesplitres(sds *tokens, int count) {
    if (tokens == NULL) return;
    for (; count; count--)
        sdsfree(tokens[count-1]);
    free(tokens);
}

/* Create an sds string holding the decimal representation of 'value'.
 * It is much faster than:
 *
 * sdscatprintf(sdsempty(),"%lld", value);
 */
sds sdsfromlonglong(long long value) {
    char buf[32], *p;
    unsigned long long v;

    /* Take the magnitude using unsigned arithmetic: negating the most
     * negative long long as a signed value overflows (undefined
     * behaviour), the unsigned negation is well defined. */
    v = (value < 0) ? 0ULL-(unsigned long long)value
                    : (unsigned long long)value;
    p = buf+31; /* point to the last character */
    /* Fill the buffer backwards, least significant digit first. */
    do {
        *p-- = '0'+(v%10);
        v /= 10;
    } while(v);
    if (value < 0) *p-- = '-';
    p++; /* step back onto the first character written */
    return sdsnewlen(p,32-(p-buf));
}

/* Append to the sds string "s" a double-quoted, escaped representation of
 * the 'len' bytes at 'p'. Backslash and double quote are backslash-escaped,
 * the usual control characters become "\n", "\r", "\t", "\a", "\b", and
 * any other byte for which isprint() is false becomes "\x<hex-number>".
 *
 * The pointer passed in must be considered invalid afterwards; use the
 * returned pointer instead.
 *
 * Returns NULL as soon as one of the append steps fails, rather than
 * passing a NULL string on to the next append. */
sds sdscatrepr(sds s, const char *p, size_t len) {
    s = sdscatlen(s,"\"",1);
    if (s == NULL) return NULL;
    while(len--) {
        switch(*p) {
        case '\\':
        case '"':
            s = sdscatprintf(s,"\\%c",*p);
            break;
        case '\n': s = sdscatlen(s,"\\n",2); break;
        case '\r': s = sdscatlen(s,"\\r",2); break;
        case '\t': s = sdscatlen(s,"\\t",2); break;
        case '\a': s = sdscatlen(s,"\\a",2); break;
        case '\b': s = sdscatlen(s,"\\b",2); break;
        default:
            /* isprint() requires a value representable as unsigned char;
             * a negative plain char would be undefined behaviour. */
            if (isprint((unsigned char)*p))
                s = sdscatprintf(s,"%c",*p);
            else
                s = sdscatprintf(s,"\\x%02x",(unsigned char)*p);
            break;
        }
        if (s == NULL) return NULL;
        p++;
    }
    return sdscatlen(s,"\"",1);
}

/* Helper for sdssplitargs(): returns 1 when 'c' is one of the characters
 * 0-9, a-f or A-F, and 0 otherwise. */
int is_hex_digit(char c) {
    if (c >= '0' && c <= '9') return 1;
    if (c >= 'a' && c <= 'f') return 1;
    if (c >= 'A' && c <= 'F') return 1;
    return 0;
}

/* Helper for sdssplitargs(): maps a hexadecimal digit (either case) to its
 * value in the range 0..15. Any other character maps to 0. */
int hex_digit_to_int(char c) {
    if (c >= '0' && c <= '9') return c-'0';
    if (c >= 'a' && c <= 'f') return 10+(c-'a');
    if (c >= 'A' && c <= 'F') return 10+(c-'A');
    return 0;
}

/* Split a line into arguments, where every argument can be in the
 * following programming-language REPL-alike form:
 *
 * foo bar "newline are supported\n" and "\xff\x00otherstuff"
 *
 * Inside double quotes the escapes \n \r \t \b \a and \xHH are decoded and
 * any other backslash-escaped character stands for itself; inside single
 * quotes only \' is recognised.
 *
 * The number of arguments is stored into *argc, and an array
 * of sds is returned.
 *
 * The caller should free the resulting array of sds strings with
 * sdsfreesplitres().
 *
 * Note that sdscatrepr() is able to convert back a string into
 * a quoted string in the same format sdssplitargs() is able to parse.
 *
 * The function returns the allocated tokens on success, even when the
 * input string is empty, or NULL if the input contains unbalanced
 * quotes or closed quotes followed by non space characters
 * as in: "foo"bar or "foo'
 *
 * NULL is also returned, with *argc set to 0 and everything collected so
 * far released, when a new token or the token array cannot be allocated.
 */
sds *sdssplitargs(const char *line, int *argc) {
    const char *p = line;
    char *current = NULL;
    char **vector = NULL;

    *argc = 0;
    while(1) {
        /* skip blanks; the cast keeps isspace() defined for bytes that are
         * negative as plain char */
        while(*p && isspace((unsigned char)*p)) p++;
        if (*p) {
            /* get a token */
            int inq=0;  /* set to 1 if we are in "quotes" */
            int insq=0; /* set to 1 if we are in 'single quotes' */
            int done=0;

            if (current == NULL) {
                current = sdsempty();
                if (current == NULL) goto err;
            }
            while(!done) {
                if (inq) {
                    if (*p == '\\' && *(p+1) == 'x' &&
                                             is_hex_digit(*(p+2)) &&
                                             is_hex_digit(*(p+3)))
                    {
                        unsigned char byte;

                        byte = (hex_digit_to_int(*(p+2))*16)+
                                hex_digit_to_int(*(p+3));
                        current = sdscatlen(current,(char*)&byte,1);
                        p += 3;
                    } else if (*p == '\\' && *(p+1)) {
                        char c;

                        p++;
                        switch(*p) {
                        case 'n': c = '\n'; break;
                        case 'r': c = '\r'; break;
                        case 't': c = '\t'; break;
                        case 'b': c = '\b'; break;
                        case 'a': c = '\a'; break;
                        default: c = *p; break;
                        }
                        current = sdscatlen(current,&c,1);
                    } else if (*p == '"') {
                        /* closing quote must be followed by a space or
                         * nothing at all. */
                        if (*(p+1) && !isspace((unsigned char)*(p+1))) goto err;
                        done=1;
                    } else if (!*p) {
                        /* unterminated quotes */
                        goto err;
                    } else {
                        current = sdscatlen(current,p,1);
                    }
                } else if (insq) {
                    if (*p == '\\' && *(p+1) == '\'') {
                        p++;
                        current = sdscatlen(current,"'",1);
                    } else if (*p == '\'') {
                        /* closing quote must be followed by a space or
                         * nothing at all. */
                        if (*(p+1) && !isspace((unsigned char)*(p+1))) goto err;
                        done=1;
                    } else if (!*p) {
                        /* unterminated quotes */
                        goto err;
                    } else {
                        current = sdscatlen(current,p,1);
                    }
                } else {
                    switch(*p) {
                    case ' ':
                    case '\n':
                    case '\r':
                    case '\t':
                    case '\0':
                        done=1;
                        break;
                    case '"':
                        inq=1;
                        break;
                    case '\'':
                        insq=1;
                        break;
                    default:
                        current = sdscatlen(current,p,1);
                        break;
                    }
                }
                if (*p) p++;
            }
            /* add the token to the vector; grow through a temporary so
             * that a failed realloc() does not lose the existing array */
            {
                char **bigger = realloc(vector,((*argc)+1)*sizeof(char*));

                if (bigger == NULL) goto err;
                vector = bigger;
            }
            vector[*argc] = current;
            (*argc)++;
            current = NULL;
        } else {
            /* Even on empty input string return something not NULL. */
            if (vector == NULL) vector = malloc(sizeof(void*));
            return vector;
        }
    }

err:
    while((*argc)--)
        sdsfree(vector[*argc]);
    free(vector);
    if (current) sdsfree(current);
    *argc = 0;
    return NULL;
}

/* Replace, in place, every character of 's' that occurs in the 'from' set
 * with the character at the same position in the 'to' array. Both arrays
 * hold 'setlen' entries; when a character occurs more than once in 'from'
 * the first occurrence decides.
 *
 * For instance: sdsmapchars(mystring, "ho", "01", 2)
 * will have the effect of turning the string "hello" into "0ell1".
 *
 * The string is never resized, so the returned pointer is always 's'. */
sds sdsmapchars(sds s, const char *from, const char *to, size_t setlen) {
    char *cur = s;
    char *stop = s+sdslen(s);

    for (; cur != stop; cur++) {
        size_t k = 0;

        /* Find the first entry of 'from' matching this character. */
        while (k < setlen && *cur != from[k]) k++;
        if (k < setlen) *cur = to[k];
    }
    return s;
}

/* Concatenate the 'argc' C strings in 'argv', inserting the 'seplen' bytes
 * at 'sep' between consecutive elements. The result is a new sds string. */
sds sdsjoin(char **argv, int argc, char *sep, size_t seplen) {
    sds out = sdsempty();
    int idx = 0;

    while (idx < argc) {
        out = sdscat(out, argv[idx]);
        idx++;
        /* No separator after the last element. */
        if (idx != argc) out = sdscatlen(out,sep,seplen);
    }
    return out;
}

/* Same as sdsjoin(), but the elements of 'argv' are sds strings, so they
 * are appended using their stored length. */
sds sdsjoinsds(sds *argv, int argc, const char *sep, size_t seplen) {
    sds out = sdsempty();
    int idx = 0;

    while (idx < argc) {
        out = sdscatsds(out, argv[idx]);
        idx++;
        /* No separator after the last element. */
        if (idx != argc) out = sdscatlen(out,sep,seplen);
    }
    return out;
}

#ifdef SDS_TEST_MAIN
#include <stdio.h>
#include "testhelp.h"

/* Self-test for the sds library, compiled only when SDS_TEST_MAIN is
 * defined. Each test_cond() records one named check; test_report() prints
 * the summary. */
int main(void) {
    {
        struct sdshdr *sh;
        sds x = sdsnew("foo"), y;

        test_cond("Create a string and obtain the length",
            sdslen(x) == 3 && memcmp(x,"foo\0",4) == 0)

        sdsfree(x);
        x = sdsnewlen("foo",2);
        test_cond("Create a string with specified length",
            sdslen(x) == 2 && memcmp(x,"fo\0",3) == 0)

        x = sdscat(x,"bar");
        test_cond("Strings concatenation",
            sdslen(x) == 5 && memcmp(x,"fobar\0",6) == 0);

        x = sdscpy(x,"a");
        test_cond("sdscpy() against an originally longer string",
            sdslen(x) == 1 && memcmp(x,"a\0",2) == 0)

        /* Compare 34 bytes (33 characters plus the terminator) so that the
         * NUL written by sdscpy() is verified as in the other checks. */
        x = sdscpy(x,"xyzxxxxxxxxxxyyyyyyyyyykkkkkkkkkk");
        test_cond("sdscpy() against an originally shorter string",
            sdslen(x) == 33 &&
            memcmp(x,"xyzxxxxxxxxxxyyyyyyyyyykkkkkkkkkk\0",34) == 0)

        sdsfree(x);
        x = sdscatprintf(sdsempty(),"%d",123);
        test_cond("sdscatprintf() seems working in the base case",
            sdslen(x) == 3 && memcmp(x,"123\0",4) ==0)

        sdsfree(x);
        x = sdsnew("xxciaoyyy");
        sdstrim(x,"xy");
        test_cond("sdstrim() correctly trims characters",
            sdslen(x) == 4 && memcmp(x,"ciao\0",5) == 0)

        y = sdsdup(x);
        sdsrange(y,1,1);
        test_cond("sdsrange(...,1,1)",
            sdslen(y) == 1 && memcmp(y,"i\0",2) == 0)

        sdsfree(y);
        y = sdsdup(x);
        sdsrange(y,1,-1);
        test_cond("sdsrange(...,1,-1)",
            sdslen(y) == 3 && memcmp(y,"iao\0",4) == 0)

        sdsfree(y);
        y = sdsdup(x);
        sdsrange(y,-2,-1);
        test_cond("sdsrange(...,-2,-1)",
            sdslen(y) == 2 && memcmp(y,"ao\0",3) == 0)

        sdsfree(y);
        y = sdsdup(x);
        sdsrange(y,2,1);
        test_cond("sdsrange(...,2,1)",
            sdslen(y) == 0 && memcmp(y,"\0",1) == 0)

        sdsfree(y);
        y = sdsdup(x);
        sdsrange(y,1,100);
        test_cond("sdsrange(...,1,100)",
            sdslen(y) == 3 && memcmp(y,"iao\0",4) == 0)

        sdsfree(y);
        y = sdsdup(x);
        sdsrange(y,100,100);
        test_cond("sdsrange(...,100,100)",
            sdslen(y) == 0 && memcmp(y,"\0",1) == 0)

        sdsfree(y);
        sdsfree(x);
        x = sdsnew("foo");
        y = sdsnew("foa");
        test_cond("sdscmp(foo,foa)", sdscmp(x,y) > 0)

        sdsfree(y);
        sdsfree(x);
        x = sdsnew("bar");
        y = sdsnew("bar");
        test_cond("sdscmp(bar,bar)", sdscmp(x,y) == 0)

        sdsfree(y);
        sdsfree(x);
        x = sdsnew("aar");
        y = sdsnew("bar");
        /* The label names the strings actually compared here. */
        test_cond("sdscmp(aar,bar)", sdscmp(x,y) < 0)

        sdsfree(y);
        sdsfree(x);
        x = sdsnewlen("\a\n\0foo\r",7);
        y = sdscatrepr(sdsempty(),x,sdslen(x));
        test_cond("sdscatrepr(...data...)",
            memcmp(y,"\"\\a\\n\\x00foo\\r\"",15) == 0)

        {
            int oldfree;

            sdsfree(x);
            x = sdsnew("0");
            /* The header lives immediately before the string bytes. */
            sh = (void*) (x-(sizeof(struct sdshdr)));
            test_cond("sdsnew() free/len buffers", sh->len == 1 && sh->free == 0);
            x = sdsMakeRoomFor(x,1);
            sh = (void*) (x-(sizeof(struct sdshdr)));
            test_cond("sdsMakeRoomFor()", sh->len == 1 && sh->free > 0);
            oldfree = sh->free;
            x[1] = '1';
            sdsIncrLen(x,1);
            test_cond("sdsIncrLen() -- content", x[0] == '0' && x[1] == '1');
            test_cond("sdsIncrLen() -- len", sh->len == 2);
            test_cond("sdsIncrLen() -- free", sh->free == oldfree-1);
        }
    }
    test_report()
    return 0;
}
#endif


================================================
FILE: dep/himemcached-0.1.0/himcdep/sds.h
================================================
/* SDS (Simple Dynamic Strings), A C dynamic strings library.
 *
 * Copyright (c) 2006-2014, Salvatore Sanfilippo <antirez at gmail dot com>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *   * Redistributions of source code must retain the above copyright notice,
 *     this list of conditions and the following disclaimer.
 *   * Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *   * Neither the name of Redis nor the names of its contributors may be used
 *     to endorse or promote products derived from this software without
 *     specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

#ifndef __SDS_H
#define __SDS_H

#define SDS_MAX_PREALLOC (1024*1024)

#include <sys/types.h>
#include <stdarg.h>
#ifdef _MSC_VER
#include "win32.h"
#endif

/* An sds value is a plain char pointer that addresses the 'buf' member of a
 * struct sdshdr; the header sits immediately before the character data. */
typedef char *sds;

struct sdshdr {
    int len;    /* Value reported by sdslen(). */
    int free;   /* Value reported by sdsavail(). */
    char buf[]; /* Character data; this is what an sds pointer addresses. */
};

/* Return the 'len' field of the header that precedes 's'. */
static inline size_t sdslen(const sds s) {
    const struct sdshdr *hdr =
        (const struct sdshdr *)(s - sizeof(struct sdshdr));

    return hdr->len;
}

/* Return the 'free' field of the header that precedes 's'. */
static inline size_t sdsavail(const sds s) {
    const struct sdshdr *hdr =
        (const struct sdshdr *)(s - sizeof(struct sdshdr));

    return hdr->free;
}

/* Creation, duplication, release and concatenation.
 * sdslen() and sdsavail() are also defined above as static inline
 * functions; the prototypes here redeclare them. */
sds sdsnewlen(const void *init, size_t initlen);
sds sdsnew(const char *init);
sds sdsempty(void);
size_t sdslen(const sds s);
sds sdsdup(const sds s);
void sdsfree(sds s);
size_t sdsavail(const sds s);
sds sdsgrowzero(sds s, size_t len);
sds sdscatlen(sds s, const void *t, size_t len);
sds sdscat(sds s, const char *t);
sds sdscatsds(sds s, const sds t);
sds sdscpylen(sds s, const char *t, size_t len);
sds sdscpy(sds s, const char *t);

/* printf-style appenders. With GCC-compatible compilers the format
 * attribute lets the compiler check the variadic arguments of
 * sdscatprintf() against 'fmt'. */
sds sdscatvprintf(sds s, const char *fmt, va_list ap);
#ifdef __GNUC__
sds sdscatprintf(sds s, const char *fmt, ...)
    __attribute__((format(printf, 2, 3)));
#else
sds sdscatprintf(sds s, const char *fmt, ...);
#endif

/* Formatting, trimming, comparison, splitting and joining helpers. */
sds sdscatfmt(sds s, char const *fmt, ...);
void sdstrim(sds s, const char *cset);
void sdsrange(sds s, int start, int end);
void sdsupdatelen(sds s);
void sdsclear(sds s);
int sdscmp(const sds s1, const sds s2);
sds *sdssplitlen(const char *s, int len, const char *sep, int seplen, int *count);
void sdsfreesplitres(sds *tokens, int count);
void sdstolower(sds s);
void sdstoupper(sds s);
sds sdsfromlonglong(long long value);
sds sdscatrepr(sds s, const char *p, size_t len);
sds *sdssplitargs(const char *line, int *argc);
sds sdsmapchars(sds s, const char *from, const char *to, size_t setlen);
sds sdsjoin(char **argv, int argc, char *sep, size_t seplen);
sds sdsjoinsds(sds *argv, int argc, const char *sep, size_t seplen);

/* Low level functions exposed to the user API */
sds sdsMakeRoomFor(sds s, size_t addlen);
void sdsIncrLen(sds s, int incr);
sds sdsRemoveFreeSpace(sds s);
size_t sdsAllocSize(sds s);

#endif


================================================
FILE: dep/himemcached-0.1.0/himcread.c
================================================
#include <string.h>
#include <stdlib.h>
#ifndef _MSC_VER
#include <unistd.h>
#endif
#include <assert.h>
#include <errno.h>
#include <ctype.h>

#include "himcread.h"
#include "himcdep/sds.h"

/* Outcome of one memcachedParseResponse() pass, stored in mcReader.result. */
#define PARSE_OK    0        /* Parsing ok */
#define PARSE_ERROR 1        /* Parsing error */
#define PARSE_AGAIN 3        /* Incomplete -> parse again */

/* Kind of response recognised by the parser, stored in mcReader.type.
 * RSP_TYPE_UNKNOWN is the value the reader is reset to between replies. */
#define RSP_TYPE_UNKNOWN        0
#define RSP_TYPE_NUM            1
#define RSP_TYPE_STORED         2
#define RSP_TYPE_NOT_STORED     3
#define RSP_TYPE_EXISTS         4
#define RSP_TYPE_NOT_FOUND      5
#define RSP_TYPE_END            6
#define RSP_TYPE_VALUE          7
#define RSP_TYPE_DELETED        8
#define RSP_TYPE_ERROR          9
#define RSP_TYPE_CLIENT_ERROR   10
#define RSP_TYPE_SERVER_ERROR   11

static void memcachedReaderReset(mcReader *r);

/* Put the reader into the error state 'type' with the description 'str'.
 *
 * All parser state and pending reply objects are dropped first, then the
 * input buffer is released. The description is copied into r->errstr and
 * silently truncated if it does not fit. */
static void __memcachedReaderSetError(mcReader *r, int type, const char *str) {
    const size_t room = sizeof(r->errstr)-1;
    size_t n;

    memcachedReaderReset(r);

    /* Clear input buffer on errors. */
    if (r->buf != NULL) {
        sdsfree(r->buf);
        r->buf = NULL;
        r->pos = r->len = 0;
    }

    /* Record the error code and its (possibly truncated) message. */
    r->err = type;
    n = strlen(str);
    if (n > room)
        n = room;
    memcpy(r->errstr,str,n);
    r->errstr[n] = '\0';
}

/* Write a double-quoted, C-escaped representation of 'byte' into 'buf'
 * (at most 'size' bytes including the terminator, as with snprintf()).
 *
 * Backslash and double quote are backslash-escaped, the usual control
 * characters use their mnemonic escapes, other printable characters are
 * emitted verbatim and everything else as \xNN.
 *
 * Returns the length snprintf() reports for the full representation, or 0
 * if snprintf() fails. */
static size_t chrtos(char *buf, size_t size, char byte)
{
    int written;

    switch(byte) {
    case '\\':
    case '"':
        written = snprintf(buf,size,"\"\\%c\"",byte);
        break;
    case '\n': written = snprintf(buf,size,"\"\\n\""); break;
    case '\r': written = snprintf(buf,size,"\"\\r\""); break;
    case '\t': written = snprintf(buf,size,"\"\\t\""); break;
    case '\a': written = snprintf(buf,size,"\"\\a\""); break;
    case '\b': written = snprintf(buf,size,"\"\\b\""); break;
    default:
        /* <ctype.h> functions require a value representable as unsigned
         * char (or EOF); a negative plain char is undefined behaviour. */
        if (isprint((unsigned char)byte))
            written = snprintf(buf,size,"\"%c\"",byte);
        else
            written = snprintf(buf,size,"\"\\x%02x\"",(unsigned char)byte);
        break;
    }

    /* A negative snprintf() result must not become a huge size_t. */
    return written < 0 ? 0 : (size_t)written;
}

/* Record an MC_ERR_PROTOCOL error whose message names the offending byte,
 * rendered in quoted/escaped form by chrtos(). */
static void __memcachedReaderSetErrorProtocolByte(mcReader *r, char byte) {
    char quoted[8];
    char message[128];

    chrtos(quoted,sizeof(quoted),byte);
    snprintf(message,sizeof(message),
        "Protocol error, got %s as reply type byte", quoted);
    __memcachedReaderSetError(r,MC_ERR_PROTOCOL,message);
}

/* Record an MC_ERR_OOM error with the fixed message "Out of memory". */
static void __memcachedReaderSetErrorOOM(mcReader *r)
{
    static const char message[] = "Out of memory";

    __memcachedReaderSetError(r,MC_ERR_OOM,message);
}

/* Allocate the temporary reply array with room for ten entries.
 *
 * The reader must not already own an array. Returns MC_OK on success; on
 * allocation failure an out-of-memory error is recorded on the reader and
 * MC_ERR is returned. */
static int elementArrayCreate(mcReader *r)
{
    const size_t initial_slots = 10;
    void **slots;

    assert(r->alloc_len == 0);
    assert(r->element == NULL);
    assert(r->elements == 0);

    slots = malloc(initial_slots*sizeof(void*));
    r->element = slots;
    if (slots == NULL) {
        __memcachedReaderSetErrorOOM(r);
        return MC_ERR;
    }

    r->alloc_len = initial_slots;
    r->elements = 0;
    return MC_OK;
}

/* Release the temporary reply array and the reply objects stored in it.
 *
 * Stored objects are released through r->fn->freeObject when that callback
 * is available; NULL slots are skipped. Afterwards the reader owns no
 * array (element == NULL, elements == 0, alloc_len == 0). Does nothing if
 * there is no array. */
static void elementArrayDestroy(mcReader *r)
{
    size_t i;

    if (r->element == NULL)
        return;

    if (r->fn && r->fn->freeObject) {
        for (i = 0; i < r->elements; i ++) {
            if (r->element[i])
                r->fn->freeObject(r->element[i]);
        }
    }
    free(r->element);
    r->element = NULL;
    r->elements = 0;
    r->alloc_len = 0;
    /* No value is returned: this function is declared void. */
}

#define EXPAND_MAX_SIZE_PER_TIME 300
/* Grow the temporary reply array.
 *
 * Capacity doubles while it is at most 150 entries and grows by
 * EXPAND_MAX_SIZE_PER_TIME entries beyond that. Returns MC_OK on success.
 * On allocation failure the existing array is left attached to the reader,
 * so the error path can release it, an out-of-memory error is recorded and
 * MC_ERR is returned. */
static int elementArrayExpand(mcReader *r)
{
    size_t new_length;
    void **grown;

    if (r->alloc_len == 0) {
        /* Never ask realloc() for zero bytes; start from the same capacity
         * elementArrayCreate() uses. */
        new_length = 10;
    } else if (r->alloc_len <= 150) {
        new_length = r->alloc_len*2;
    } else {
        /* Covers every larger size, so new_length is always initialised. */
        new_length = r->alloc_len+EXPAND_MAX_SIZE_PER_TIME;
    }

    /* Keep the old pointer until realloc() is known to have succeeded. */
    grown = realloc(r->element,new_length*sizeof(void*));
    if (grown == NULL) {
        __memcachedReaderSetErrorOOM(r);
        return MC_ERR;
    }
    r->element = grown;
    r->alloc_len = new_length;

    return MC_OK;
}

/* Append 'reply' to the temporary reply array, growing the array first when
 * it is full. Returns MC_OK, or MC_ERR if the array could not be grown. */
static int elementArrayAdd(mcReader *r, void *reply)
{
    int full;

    assert(r->elements <= r->alloc_len);

    full = (r->elements == r->alloc_len);
    if (full && elementArrayExpand(r) != MC_OK)
        return MC_ERR;

    r->element[r->elements] = reply;
    r->elements++;

    return MC_OK;
}

/* Incrementally parse one memcached text-protocol response from the bytes
 * r->buf[r->pos .. r->len).
 *
 * The outcome is stored in r->result:
 *   PARSE_OK    - a full response was consumed; r->type tells which kind and
 *                 r->pos points just past its final "\n".
 *   PARSE_AGAIN - all available bytes were consumed without completing a
 *                 response; r->state holds the state to resume from.
 *   PARSE_ERROR - an unexpected byte was met; errno is set to EINVAL.
 *
 * If memory runs out while collecting VALUE items, the reader is put into
 * the MC_ERR_OOM error state (r->err) and the function returns at once.
 *
 * NOTE(review): r->token and r->str point straight into r->buf, so they are
 * only valid while the buffer is neither reallocated nor compacted. */
static void memcachedParseResponse(mcReader *r)
{
    void *obj = NULL;
    char *p, *m;
    char ch;
    enum {
        SW_START,
        SW_RSP_NUM,
        SW_RSP_STR,
        SW_SPACES_BEFORE_KEY,
        SW_KEY,
        SW_SPACES_BEFORE_FLAGS,     /* 5 */
        SW_FLAGS,
        SW_SPACES_BEFORE_VLEN,
        SW_VLEN,
        SW_RUNTO_VAL,
        SW_VAL,                     /* 10 */
        SW_VAL_LF,
        SW_END,
        SW_RUNTO_CRLF,
        SW_CRLF,
        SW_ALMOST_DONE,             /* 15 */
        SW_SENTINEL
    } state;

    state = r->state;

    assert(state >= SW_START && state < SW_SENTINEL);

    /* validate the parsing marker */
    assert(r->buf != NULL);
    assert(r->pos < r->len);

    /* Only bytes that were actually received are examined. The terminator
     * stored at r->buf[r->len] is not input and must not be parsed. */
    for (p = r->buf+r->pos; p < r->buf+r->len; p++) {
        ch = *p;

        switch (state) {
        case SW_START:
            if (isdigit((unsigned char)ch)) {
                state = SW_RSP_NUM;
            } else {
                state = SW_RSP_STR;
            }
            p = p - 1; /* go back by 1 byte */

            break;

        case SW_RSP_NUM:
            if (r->token == NULL) {
                /* rsp_start <- p; type_start <- p */
                r->token = p;
            }

            if (isdigit((unsigned char)ch)) {
                /* num <- num * 10 + (ch - '0') */
                r->integer = r->integer*10 + (long long)(ch-'0');
            } else if (ch == ' ' || ch == '\r') {
                /* type_end <- p - 1 */
                r->token = NULL;
                /* r->integer keeps the parsed number: it is the value of
                 * the integer reply built once the line is complete. */
                r->type = RSP_TYPE_NUM;
                p = p - 1; /* go back by 1 byte */
                state = SW_CRLF;
            } else {
                goto error;
            }

            break;

        case SW_RSP_STR:
            if (r->token == NULL) {
                /* rsp_start <- p; type_start <- p */
                r->token = p;
            }

            if (ch == ' ' || ch == '\r') {
                /* type_end <- p - 1 */
                m = r->token;
                /* r->token = NULL; */
                r->type = RSP_TYPE_UNKNOWN;
                assert(r->str == NULL && r->strlen == 0);

                /* Dispatch on the length of the first word of the line. */
                switch (p - m) {
                case 3:
                    if (!strncmp(m,"END\r",4)) {
                        r->type = RSP_TYPE_END;
                        /* end_start <- m; end_end <- p - 1 */
                    }

                    break;

                case 5:
                    if (!strncmp(m,"VALUE",5)) {
                        /*
                         * Encompasses responses for 'get', 'gets' and
                         * 'cas' command.
                         */
                        r->type = RSP_TYPE_VALUE;
                        break;
                    }

                    if (!strncmp(m,"ERROR",5)) {
                        r->type = RSP_TYPE_ERROR;
                        break;
                    }

                    break;

                case 6:
                    if (!strncmp(m,"STORED",6)) {
                        r->type = RSP_TYPE_STORED;

                        r->str = m;
                        r->strlen = 6;
                        break;
                    }

                    if (!strncmp(m,"EXISTS",6)) {
                        r->type = RSP_TYPE_EXISTS;

                        r->str = m;
                        r->strlen = 6;
                        break;
                    }

                    break;

                case 7:
                    if (!strncmp(m,"DELETED",7)) {
                        r->type = RSP_TYPE_DELETED;

                        r->str = m;
                        r->strlen = 7;
                        break;
                    }

                    break;

                case 9:
                    if (!strncmp(m,"NOT_FOUND",9)) {
                        r->type = RSP_TYPE_NOT_FOUND;

                        r->str = m;
                        r->strlen = 9;
                        break;
                    }

                    break;

                case 10:
                    if (!strncmp(m,"NOT_STORED",10)) {
                        r->type = RSP_TYPE_NOT_STORED;

                        r->str = m;
                        r->strlen = 10;
                        break;
                    }

                    break;

                case 12:
                    if (!strncmp(m,"CLIENT_ERROR",12)) {
                        r->type = RSP_TYPE_CLIENT_ERROR;
                        break;
                    }

                    if (!strncmp(m,"SERVER_ERROR",12)) {
                        r->type = RSP_TYPE_SERVER_ERROR;
                        break;
                    }

                    break;
                }

                switch (r->type) {
                case RSP_TYPE_UNKNOWN:
                    goto error;

                case RSP_TYPE_STORED:
                case RSP_TYPE_NOT_STORED:
                case RSP_TYPE_EXISTS:
                case RSP_TYPE_NOT_FOUND:
                case RSP_TYPE_DELETED:
                    state = SW_CRLF;
                    break;

                case RSP_TYPE_END:
                    state = SW_CRLF;
                    break;

                case RSP_TYPE_VALUE:
                    state = SW_SPACES_BEFORE_KEY;
                    break;

                case RSP_TYPE_ERROR:
                    state = SW_CRLF;
                    break;

                case RSP_TYPE_CLIENT_ERROR:
                case RSP_TYPE_SERVER_ERROR:
                    /* The error text is collected by SW_RUNTO_CRLF. */
                    r->token = NULL;
                    state = SW_RUNTO_CRLF;
                    break;

                default:
                    NOT_REACHED();
                }

                p = p - 1; /* go back by 1 byte */
            }

            break;

        case SW_SPACES_BEFORE_KEY:
            if (ch != ' ') {
                state = SW_KEY;
                p = p - 1; /* go back by 1 byte */
                r->token = NULL;
            }

            break;

        case SW_KEY:
            if (r->token == NULL) {
                r->token = p;
            }

            if (ch == ' ') {
                assert(r->str == NULL && r->strlen == 0);
                m = r->token;
                r->token = NULL;
                state = SW_SPACES_BEFORE_FLAGS;
                r->strlen = p-m;
                r->str = m;
            }

            break;

        case SW_SPACES_BEFORE_FLAGS:
            if (ch != ' ') {
                if (!isdigit((unsigned char)ch)) {
                    goto error;
                }
                state = SW_FLAGS;
                p = p - 1; /* go back by 1 byte */
                r->kflags = 0;
            }

            break;

        case SW_FLAGS:
            if (isdigit((unsigned char)ch)) {
                /* flags <- flags * 10 + (ch - '0') */
                r->kflags = r->kflags*10 + (int)(ch-'0');
            } else if (ch == ' ') {
                /* flags_end <- p - 1 */
                /* r->token = NULL; */
                state = SW_SPACES_BEFORE_VLEN;
            } else {
                goto error;
            }

            break;

        case SW_SPACES_BEFORE_VLEN:
            if (ch != ' ') {
                if (!isdigit((unsigned char)ch)) {
                    goto error;
                }
                p = p - 1; /* go back by 1 byte */
                state = SW_VLEN;
                r->integer = 0;
            }

            break;

        case SW_VLEN:
            if (isdigit((unsigned char)ch)) {
                r->integer = r->integer*10 + (long long)(ch-'0');
            } else if (ch == ' ' || ch == '\r') {
                /* vlen_end <- p - 1 */
                p = p - 1; /* go back by 1 byte */
                /* r->token = NULL; */
                state = SW_RUNTO_CRLF;
            } else {
                goto error;
            }

            break;

        case SW_RUNTO_VAL:
            switch (ch) {
            case '\n':
                /* val_start <- p + 1 */
                state = SW_VAL;
                r->token = NULL;
                break;

            default:
                goto error;
            }

            break;

        case SW_VAL:
            if (r->token == NULL) {
                /* val_start <- p */
                r->token = p;
            }

            /* m is where the '\r' that follows the value must be. */
            m = r->token + r->integer;
            if (m >= r->buf+r->len) {
                /* That byte has not arrived yet: consume what is there and
                 * resume in this state once more data has been fed. */
                p = r->buf + r->len - 1;
                break;
            }

            switch (*m) {
            case '\r':
                /* val_end <- p - 1 */
                p = m; /* move forward by vlen bytes */
                state = SW_VAL_LF;
                break;

            default:
                goto error;
            }

            break;

        case SW_VAL_LF:
            switch (ch) {
            case '\n':
                /* state = SW_END; */
                if (r->fn && r->fn->createString) {
                    obj = r->fn->createString(MC_REPLY_STRING,r->str,r->strlen,
                        r->token,r->integer,r->kflags,r->kversion);
                    if (obj == NULL) {
                        /* A NULL object from a create callback means OOM. */
                        __memcachedReaderSetErrorOOM(r);
                        return;
                    }
                } else {
                    obj = (void*)MC_REPLY_STRING;
                }

                /* The first item is parked in r->subreply; from the second
                 * item on, everything is collected in the element array. */
                if (r->element) {
                    assert(r->subreply == NULL);
                    if (elementArrayAdd(r,obj) != MC_OK)
                        goto oom;
                } else if (r->subreply) {
                    if (elementArrayCreate(r) != MC_OK)
                        goto oom;
                    if (elementArrayAdd(r,r->subreply) != MC_OK)
                        goto oom;
                    r->subreply = NULL;
                    if (elementArrayAdd(r,obj) != MC_OK)
                        goto oom;
                } else {
                    r->subreply = obj;
                }

                r->token = NULL;
                r->str = NULL;
                r->strlen = 0;
                r->kflags = 0;
                r->kversion = -1;
                /* Either another VALUE line or the closing END follows. */
                state = SW_RSP_STR;
                break;

            default:
                goto error;
            }

            break;

        case SW_END:
            if (r->token == NULL) {
                if (ch != 'E') {
                    goto error;
                }
                /* end_start <- p */
                r->token = p;
            } else if (ch == '\r') {
                /* end_end <- p */
                m = r->token;
                r->token = NULL;

                switch (p - m) {
                case 3:
                    if (!strncmp(m,"END\r",4)) {
                        state = SW_ALMOST_DONE;
                    }
                    break;

                default:
                    goto error;
                }
            }

            break;

        case SW_RUNTO_CRLF:
            switch (ch) {
            case '\r':
                if (r->type == RSP_TYPE_VALUE) {
                    state = SW_RUNTO_VAL;
                } else {
                    if (r->type == RSP_TYPE_CLIENT_ERROR ||
                        r->type == RSP_TYPE_SERVER_ERROR) {
                        m = r->token;
                        r->token = NULL;
                        r->strlen = p-m;
                        r->str = m;
                    }
                    state = SW_ALMOST_DONE;
                }

                break;

            default:
                break;
            }

            break;

        case SW_CRLF:
            switch (ch) {
            case ' ':
                break;

            case '\r':
                state = SW_ALMOST_DONE;
                break;

            default:
                goto error;
            }

            break;

        case SW_ALMOST_DONE:
            switch (ch) {
            case '\n':
                /* rsp_end <- p */
                goto done;

            default:
                goto error;
            }

            break;

        case SW_SENTINEL:
        default:
            NOT_REACHED();
            break;

        }
    }

    /* Every available byte was consumed without completing a response. */
    assert(p == r->buf+r->len);
    r->pos = r->len;
    r->state = state;

    r->result = PARSE_AGAIN;

    return;

done:
    r->pos = p-r->buf+1;
    assert(r->pos <= r->len);
    r->state = SW_START;
    r->token = NULL;
    r->result = PARSE_OK;

    return;

oom:
    /* The element-array helpers already recorded the out-of-memory error and
     * released the reader state, including the input buffer 'p' pointed
     * into. Only the object that never reached the reader is left; it is
     * released when it came from the createString callback. */
    if (r->fn && r->fn->createString && r->fn->freeObject)
        r->fn->freeObject(obj);
    return;

error:
    r->result = PARSE_ERROR;
    r->state = state;
    errno = EINVAL;
}

/* Allocate a reader that builds its reply objects through the callbacks in
 * 'fn'. The reader starts with an empty input buffer, no pending reply and
 * the parser in its initial state.
 *
 * Returns NULL when either the reader or its buffer cannot be allocated. */
mcReader *memcachedReaderCreateWithFunctions(mcReplyObjectFunctions *fn)
{
    mcReader *reader = calloc(sizeof(mcReader),1);

    if (reader == NULL)
        return NULL;

    reader->buf = sdsempty();
    if (reader->buf == NULL) {
        free(reader);
        return NULL;
    }
    reader->maxbuf = MC_READER_MAX_BUF;

    /* Error state. */
    reader->err = 0;
    reader->errstr[0] = '\0';

    /* Pending reply objects. */
    reader->subreply = NULL;
    reader->element = NULL;
    reader->elements = 0;
    reader->alloc_len = 0;

    /* Parser state. */
    reader->state = 0;
    reader->token = NULL;
    reader->type = RSP_TYPE_UNKNOWN;
    reader->result = PARSE_OK;

    /* Fields of the response being parsed. */
    reader->str = NULL;
    reader->strlen = 0;
    reader->kflags = 0;
    reader->kversion = -1;
    reader->integer = 0;

    reader->fn = fn;

    return reader;
}

/* Release a reader together with its pending reply objects and its input
 * buffer. Passing NULL is allowed and does nothing, as with free(). */
void memcachedReaderFree(mcReader *r)
{
    if (r == NULL)
        return;

    /* Drops the parked sub-reply and the temporary element array. */
    memcachedReaderReset(r);

    /* The buffer is already NULL when the reader hit an error earlier. */
    if (r->buf != NULL)
        sdsfree(r->buf);
    free(r);
}

/* Append 'len' bytes from 'buf' to the reader's input buffer.
 *
 * Returns MC_OK on success, including when there is nothing to append
 * ('buf' is NULL or 'len' is 0). Returns MC_ERR when the reader is already
 * in an error state or when the buffer cannot be grown; in the latter case
 * an out-of-memory error is recorded on the reader. */
int memcachedReaderFeed(mcReader *r, const char *buf, size_t len)
{
    sds newbuf;
    size_t token_off = 0, str_off = 0;
    int has_token, has_str;

    /* Return early when this reader is in an erroneous state. */
    if (r->err)
        return MC_ERR;

    /* Nothing to copy. */
    if (buf == NULL || len < 1)
        return MC_OK;

    /* While a response is only partially parsed, r->token and r->str hold
     * addresses inside r->buf. Appending may move the buffer, so remember
     * them as offsets and rebuild the pointers afterwards. */
    has_token = (r->token != NULL);
    has_str = (r->str != NULL);
    if (has_token)
        token_off = (size_t)(r->token - r->buf);
    if (has_str)
        str_off = (size_t)(r->str - r->buf);

    /* Destroy internal buffer when it is empty and is quite large. */
    if (r->len == 0 && r->maxbuf != 0 && sdsavail(r->buf) > r->maxbuf) {
        sdsfree(r->buf);
        r->buf = sdsempty();
        r->pos = 0;

        /* r->buf should not be NULL since we just free'd a larger one. */
        assert(r->buf != NULL);
    }

    newbuf = sdscatlen(r->buf,buf,len);
    if (newbuf == NULL) {
        __memcachedReaderSetErrorOOM(r);
        return MC_ERR;
    }

    r->buf = newbuf;
    r->len = sdslen(r->buf);
    if (has_token)
        r->token = r->buf + token_off;
    if (has_str)
        r->str = r->buf + str_off;

    return MC_OK;
}

/* Return the reader to its "no response in progress" state.
 *
 * Parser fields and the error state are cleared, and any pending reply
 * objects (the parked sub-reply and the temporary element array) are
 * released. The input buffer and its cursor are left untouched. */
static void memcachedReaderReset(mcReader *r)
{
    /* Parser position and outcome. */
    r->state = 0;
    r->token = NULL;
    r->type = RSP_TYPE_UNKNOWN;
    r->result = PARSE_OK;

    /* Fields of the response that was being parsed. */
    r->str = NULL;
    r->strlen = 0;
    r->kflags = 0;
    r->kversion = -1;
    r->integer = 0;

    /* Pending reply objects. */
    if (r->subreply != NULL) {
        if (r->fn && r->fn->freeObject)
            r->fn->freeObject(r->subreply);

        r->subreply = NULL;
    }
    elementArrayDestroy(r);

    /* Error state. */
    r->err = 0;
    r->errstr[0] = '\0';
}

/* Build the reply object for the response that was just parsed.
 *
 * A response made of VALUE items always ends with an END line, so r->type
 * is RSP_TYPE_END by the time it completes. The items collected before it
 * are the reply:
 *   - two or more items: an array reply (ownership of the element array is
 *     handed to the createArray callback);
 *   - exactly one item: that item itself;
 *   - no item at all: a nil reply.
 *
 * When a create callback is missing, the matching MC_REPLY_* constant is
 * returned cast to a pointer, as a marker. Returns NULL for an unknown
 * response type. */
static void *getReplyFromReader(mcReader *r)
{
    void *reply = NULL;

    switch (r->type) {
        case RSP_TYPE_VALUE:
        case RSP_TYPE_END:
            if (r->element) {
                assert(r->subreply == NULL);
                if (r->fn && r->fn->createArray) {
                    reply = r->fn->createArray(r->elements,r->element);
                    r->element = NULL;
                    r->elements = 0;
                    r->alloc_len = 0;
                } else {
                    reply = (void*)MC_REPLY_ARRAY;
                }
            } else if (r->subreply) {
                /* Hand the object over to the caller. Detach it so the reset
                 * that follows does not free what was just returned. */
                reply = r->subreply;
                r->subreply = NULL;
            } else if (r->fn && r->fn->createNil) {
                reply = r->fn->createNil();
            } else {
                reply = (void*)MC_REPLY_NIL;
            }
            break;
        case RSP_TYPE_NUM:
            if (r->fn && r->fn->createInteger)
                reply = r->fn->createInteger(r->integer);
            else
                reply = (void*)MC_REPLY_INTEGER;
            break;
        case RSP_TYPE_CLIENT_ERROR:
        case RSP_TYPE_SERVER_ERROR:
            if (r->fn && r->fn->createString)
                reply = r->fn->createString(MC_REPLY_ERROR,
                    NULL,0,r->str,r->strlen,0,0);
            else
                reply = (void*)MC_REPLY_ERROR;
            break;
        case RSP_TYPE_ERROR:
            if (r->fn && r->fn->createString)
                reply = r->fn->createString(MC_REPLY_ERROR,
                    NULL,0,"",0,0,0);
            else
                reply = (void*)MC_REPLY_ERROR;
            break;
        case RSP_TYPE_STORED:
        case RSP_TYPE_NOT_STORED:
        case RSP_TYPE_EXISTS:
        case RSP_TYPE_NOT_FOUND:
        case RSP_TYPE_DELETED:
            if (r->fn && r->fn->createString)
                reply = r->fn->createString(MC_REPLY_STATUS,
                    NULL,0,r->str,r->strlen,0,0);
            else
                reply = (void*)MC_REPLY_STATUS;
            break;
        default:
            reply = NULL;
            break;
    }

    return reply;
}

/* Try to extract one reply from the bytes fed so far.
 *
 * On return '*reply' (when 'reply' is not NULL) is the reply object, or NULL
 * if no complete response is available yet.
 *
 * Returns MC_OK when a reply was produced or more data is needed. Returns
 * MC_ERR when the reader is, or has just entered, an error state; r->err
 * and r->errstr then describe the problem. */
int memcachedReaderGetReply(mcReader *r, void **reply) {
    /* Default target pointer to NULL. */
    if (reply != NULL)
        *reply = NULL;

    /* Return early when this reader is in an erroneous state. */
    if (r->err)
        return MC_ERR;

    /* When the buffer is empty, there will never be a reply. */
    if (r->len == 0)
        return MC_OK;

    /* Parse only when unread bytes exist; the parser requires pos < len. */
    if (r->pos < r->len) {
        memcachedParseResponse(r);

        /* Return ASAP when an error occurred. */
        if (r->err)
            return MC_ERR;

        /* A malformed response cannot be recovered from. Surface it as a
         * protocol error instead of reporting "no reply yet" forever. */
        if (r->result == PARSE_ERROR) {
            __memcachedReaderSetError(r,MC_ERR_PROTOCOL,
                "Protocol error, unexpected byte in reply");
            return MC_ERR;
        }

        /* Emit a reply when there is one. */
        if (r->result == PARSE_OK) {
            if (reply != NULL) {
                *reply = getReplyFromReader(r);
            }
            memcachedReaderReset(r);
        }
    }

    /* Discard part of the buffer when we've consumed at least 1k, to avoid
     * doing unnecessary calls to memmove() in sds.c. This is skipped while
     * r->token or r->str still point into the buffer. */
    if (r->pos >= 1024 && r->token == NULL && r->str == NULL) {
        sdsrange(r->buf,r->pos,-1);
        r->pos = 0;
        r->len = sdslen(r->buf);
    }

    return MC_OK;
}


================================================
FILE: dep/himemcached-0.1.0/himcread.h
================================================
#ifndef _HIMC_READ_H_
#define _HIMC_READ_H_
#include <stdio.h> /* for size_t */

#include <himcread.h>

#define MC_ERR   -1
#define MC_OK    0

/* When an error occurs, the err flag of a reader is set to hold the type of
 * error that occurred. MC_ERR_IO means there was an I/O error and you
 * should use the "errno" variable to find out what is wrong.
 * For other values, the "errstr" field will hold a description. */
#define MC_ERR_IO 1 /* Error in read or write */
#define MC_ERR_EOF 3 /* End of file */
#define MC_ERR_PROTOCOL 4 /* Protocol error */
#define MC_ERR_OOM 5 /* Out of memory */
#define MC_ERR_OTHER 2 /* Everything else... */

#define MC_REPLY_STRING     1
#define MC_REPLY_ARRAY      2
#define MC_REPLY_INTEGER    3
#define MC_REPLY_NIL        4
#define MC_REPLY_STATUS     5
#define MC_REPLY_ERROR      6

#define MC_READER_MAX_BUF (1024*16)  /* Default max unused reader buffer. */

#ifdef __cplusplus
extern "C" {
#endif

/* Callbacks a reader uses to build and release reply objects. The reader
 * checks each pointer before calling it, so entries may be NULL. */
typedef struct mcReplyObjectFunctions {
    /* Arguments as the reader passes them: reply type (MC_REPLY_*), key and
     * key length, string and string length, key flags, key version. */
    void *(*createString)(int, char*, size_t, char*, size_t, int, long long);
    /* Arguments: number of elements, then the array of element objects. */
    void *(*createArray)(size_t, void **);
    /* Argument: the integer value of the reply. */
    void *(*createInteger)(long long);
    void *(*createNil)(void);
    /* Releases an object produced by one of the create callbacks. */
    void (*freeObject)(void*);
} mcReplyObjectFunctions;

/* State of one incremental memcached response reader: input buffer, parser
 * position, the fields of the response being parsed and the reply objects
 * collected so far. */
typedef struct mcReader {
    int err; /* Error flags, 0 when there is no error */
    char errstr[128]; /* String representation of error when applicable */

    char *buf; /* Read buffer */
    size_t pos; /* Buffer cursor */
    size_t len; /* Buffer length */
    size_t maxbuf; /* Max length of unused buffer */

    void *subreply; /* Temporary reply for array type */
    size_t alloc_len; /* Temporary reply array alloc length */
    size_t elements; /* Temporary reply array length */
    void **element; /* Temporary reply array */

    char *str; /* Points into buf: key, status word or error text of the response being parsed */
    size_t strlen; /* Number of bytes at str */
    int kflags;  /* Used for key flags (get/gets command reply) */
    long long kversion;  /* Used for key version (gets command reply) */

    int state;  /* Current parser state */
    char *token;    /* Token marker */

    long long integer; /* Cache the integer if need */

    int type;   /* Response type */
    int result; /* Parsing result */

    mcReplyObjectFunctions *fn;
    void *privdata; /* NOTE(review): not used by the reader code itself; presumably reserved for the callbacks -- confirm */
} mcReader;

/* Public API for the protocol parser. */

/* Allocate a reader that builds replies through 'fn'; NULL on allocation
 * failure. */
mcReader *memcachedReaderCreateWithFunctions(mcReplyObjectFunctions *fn);
/* Release a reader, its pending reply objects and its input buffer. */
void memcachedReaderFree(mcReader *r);
/* Append 'len' bytes from 'buf' to the input buffer; MC_OK or MC_ERR. */
int memcachedReaderFeed(mcReader *r, const char *buf, size_t len);
/* Parse the buffered input; '*reply' receives the reply object, or NULL
 * when none is available. Returns MC_OK or MC_ERR. */
int memcachedReaderGetReply(mcReader *r, void **reply);

#ifdef __cplusplus
}
#endif

#endif


================================================
FILE: dep/himemcached-0.1.0/himemcached.c
================================================
#include <assert.h>
#include <errno.h>
#include <stdlib.h>
#include <string.h>

#include "himemcached.h"

#define REQ_TYPE_UNKNOWN        0
#define REQ_TYPE_STORAGE        1
#define REQ_TYPE_CAS            2
#define REQ_TYPE_RETRIEVAL      3
#define REQ_TYPE_ARITHMETIC     4
#define REQ_TYPE_DELETE         5

static mcReply *createReplyObject(int type);
static void *createStringObject(int type, char *key, size_t keylen, char *str, size_t len, int flags, long long version);
static void *createArrayObject(size_t elements, void **element);
static void *createIntegerObject(long long value);
static void *createNilObject(void);

/* Default set of functions to build the reply. Keep in mind that such a
 * function returning NULL is interpreted as OOM.
 *
 * The initializers are positional and follow the member order of
 * mcReplyObjectFunctions: createString, createArray, createInteger,
 * createNil, freeObject. memcachedReaderCreate() passes this table to
 * memcachedReaderCreateWithFunctions(). */
static mcReplyObjectFunctions defaultFunctions = {
    createStringObject,   /* createString */
    createArrayObject,    /* createArray */
    createIntegerObject,  /* createInteger */
    createNilObject,      /* createNil */
    freeMcReplyObject     /* freeObject */
};

/* Create a reply object */
static mcReply *createReplyObject(int type) {
    mcReply *r = calloc(1,sizeof(*r));

    if (r == NULL)
        return NULL;

    r->type = type;
    
    return r;
}

/* Release a reply object and everything it owns.
 *
 * String-like replies own their key and string buffers, array replies own
 * the element vector and (recursively) every element in it. Integer and nil
 * replies own nothing besides the object itself. Passing NULL is a no-op. */
void freeMcReplyObject(void *reply) {
    mcReply *obj = reply;
    size_t idx;

    if (obj == NULL)
        return;

    switch(obj->type) {
    case MC_REPLY_STRING:
    case MC_REPLY_STATUS:
    case MC_REPLY_ERROR:
        /* free(NULL) is a no-op, so absent buffers need no guard. */
        free(obj->key);
        free(obj->str);
        break;
    case MC_REPLY_ARRAY:
        if (obj->element == NULL)
            break;
        /* NULL slots are skipped by the recursive call itself. */
        for (idx = 0; idx < obj->elements; idx++)
            freeMcReplyObject(obj->element[idx]);
        free(obj->element);
        break;
    case MC_REPLY_NIL:
    case MC_REPLY_INTEGER:
        /* Nothing extra to release. */
        break;
    default:
        assert(0);
        break;
    }
    free(obj);
}

/* Build a string-like reply (MC_REPLY_STRING, MC_REPLY_STATUS or
 * MC_REPLY_ERROR).
 *
 * 'key'/'keylen' are optional: when 'key' is NULL the reply carries no key.
 * 'str'/'len' describe the payload; both key and payload are copied into
 * freshly allocated, NUL-terminated buffers owned by the reply. 'flags' and
 * 'version' are stored verbatim.
 *
 * Returns the new reply, or NULL when an allocation fails (nothing leaks in
 * that case). */
static void *createStringObject(int type, char *key, size_t keylen, char *str, size_t len, int flags, long long version) {
    mcReply *r;
    char *buf;

    assert(type == MC_REPLY_ERROR  ||
           type == MC_REPLY_STATUS ||
           type == MC_REPLY_STRING);

    r = createReplyObject(type);
    if (r == NULL)
        return NULL;

    if (key != NULL) {
        r->key = malloc(keylen+1);
        if (r->key == NULL) {
            freeMcReplyObject(r);
            return NULL;
        }
        if (keylen > 0)
            /* Copy key bytes */
            memcpy(r->key,key,keylen);
        r->key[keylen] = '\0';
        r->keylen = keylen;
    }

    buf = malloc(len+1);
    if (buf == NULL) {
        /* Also releases the key copied above, if any. */
        freeMcReplyObject(r);
        return NULL;
    }
    if (len > 0)
        /* Copy string value */
        memcpy(buf,str,len);
    buf[len] = '\0';
    r->str = buf;
    r->len = len;

    r->flags = flags;
    r->version = version;

    return r;
}

/* Wrap an element vector in an MC_REPLY_ARRAY reply. The vector is not
 * copied: the reply stores the pointer as given. Returns NULL when the
 * reply object cannot be allocated. */
static void *createArrayObject(size_t elements, void **element) {
    mcReply *array = createReplyObject(MC_REPLY_ARRAY);

    if (array != NULL) {
        array->element = (mcReply **)element;
        array->elements = elements;
    }

    return array;
}

/* Build an MC_REPLY_INTEGER reply holding 'value'. Returns NULL when the
 * reply object cannot be allocated. */
static void *createIntegerObject(long long value) {
    mcReply *num = createReplyObject(MC_REPLY_INTEGER);

    if (num != NULL)
        num->integer = value;

    return num;
}

/* Build an MC_REPLY_NIL reply. Returns NULL when the reply object cannot be
 * allocated. */
static void *createNilObject(void) {
    /* A nil reply carries no payload, so the tagged object is the result. */
    return createReplyObject(MC_REPLY_NIL);
}

/* Record an error on the context.
 *
 * 'type' is one of the MC_ERR_* codes and is stored in c->err. 'str' is the
 * human readable description; it is truncated if needed so that it always
 * fits, NUL-terminated, in c->errstr.
 *
 * 'str' may be NULL only for MC_ERR_IO: in that case the description is
 * derived from the current value of errno, so the function must be called
 * right after the failing system call. */
void __memcachedSetError(mcContext *c, int type, const char *str) {
    /* Capture errno first so nothing below can clobber it. */
    int saved_errno = errno;
    size_t len;

    c->err = type;
    if (str == NULL) {
        /* Only MC_ERR_IO may lack a description! */
        assert(type == MC_ERR_IO);
        str = strerror(saved_errno);
        if (str == NULL)
            str = "Unknown I/O error";
    }

    len = strlen(str);
    len = len < (sizeof(c->errstr)-1) ? len : (sizeof(c->errstr)-1);
    memcpy(c->errstr,str,len);
    c->errstr[len] = '\0';
}


/* Write the output buffer to the socket.
 *
 * Returns MC_OK when the buffer is empty, or (a part of) the buffer was
 * successfully written to the socket. When the buffer is empty after the
 * write operation, "done" is set to 1 (if given).
 *
 * Returns MC_ERR if an error occurred trying to write and sets
 * c->errstr to hold the appropriate error string. This includes the case
 * where the buffer was fully flushed but a fresh empty buffer could not be
 * allocated (MC_ERR_OOM).
 */
int memcachedBufferWrite(mcContext *c, int *done) {
    int nwritten;

    /* Return early when the context has seen an error. */
    if (c->err)
        return MC_ERR;

    if (sdslen(c->obuf) > 0) {
        nwritten = write(c->fd,c->obuf,sdslen(c->obuf));
        if (nwritten == -1) {
            if ((errno == EAGAIN && !(c->flags & MC_BLOCK)) || (errno == EINTR)) {
                /* Try again later */
            } else {
                __memcachedSetError(c,MC_ERR_IO,NULL);
                return MC_ERR;
            }
        } else if (nwritten > 0) {
            if (nwritten == (signed)sdslen(c->obuf)) {
                /* Everything went out: start over with an empty buffer. */
                sdsfree(c->obuf);
                c->obuf = sdsempty();
                if (c->obuf == NULL) {
                    /* Without this check the sdslen() below would
                     * dereference a NULL buffer. */
                    __memcachedSetError(c,MC_ERR_OOM,"Out of memory");
                    return MC_ERR;
                }
            } else {
                /* Partial write: keep only the unsent tail. */
                sdsrange(c->obuf,nwritten,-1);
            }
        }
    }
    if (done != NULL) *done = (sdslen(c->obuf) == 0);
    return MC_OK;
}

/* Ask the context's reader for the next parsed reply and store it in
 * '*reply'. When the reader reports a failure, its error code and message
 * are copied onto the context and MC_ERR is returned; otherwise MC_OK. */
int memcachedGetReplyFromReader(mcContext *c, void **reply) {
    mcReader *reader = c->reader;

    if (memcachedReaderGetReply(reader,reply) != MC_ERR)
        return MC_OK;

    __memcachedSetError(c,reader->err,reader->errstr);
    return MC_ERR;
}

/* Fetch one reply for the context.
 *
 * A reply already available in the reader is returned right away. If none
 * is pending and the context is blocking (MC_BLOCK), the output buffer is
 * flushed completely and the socket is read until a full reply has been
 * parsed. For a non-blocking context with nothing pending, '*reply' is set
 * to NULL.
 *
 * Returns MC_OK on success and MC_ERR when writing, reading or parsing
 * fails. 'reply' may be NULL, in which case the result is not stored. */
int memcachedGetReply(mcContext *c, void **reply) {
    void *pending = NULL;
    int flushed = 0;

    /* Anything already parsed and waiting? */
    if (memcachedGetReplyFromReader(c,&pending) == MC_ERR)
        return MC_ERR;

    if (pending == NULL && (c->flags & MC_BLOCK)) {
        /* Push out the whole output buffer first... */
        while (!flushed) {
            if (memcachedBufferWrite(c,&flushed) == MC_ERR)
                return MC_ERR;
        }

        /* ...then keep reading until a complete reply shows up. */
        while (pending == NULL) {
            if (memcachedBufferRead(c) == MC_ERR)
                return MC_ERR;
            if (memcachedGetReplyFromReader(c,&pending) == MC_ERR)
                return MC_ERR;
        }
    }

    if (reply != NULL)
        *reply = pending;
    return MC_OK;
}

mcReader *memcachedReaderCreate(void) {
    return memcachedReaderCreateWithFunctions(&defaultFunctions);
}

/* Allocate a context with an empty output buffer and a default reader.
 * Connection-related fields start out unset. Returns NULL when any of the
 * allocations fails; nothing is leaked in that case. */
mcContext *memcachedContextInit(void) {
    mcContext *ctx = calloc(1,sizeof(*ctx));

    if (ctx == NULL)
        return NULL;

    /* No error yet. */
    ctx->err = 0;
    ctx->errstr[0] = '\0';

    /* Owned resources; checked together below. */
    ctx->obuf = sdsempty();
    ctx->reader = memcachedReaderCreate();

    /* No endpoint or timeout configured yet. */
    ctx->tcp.host = NULL;
    ctx->tcp.source_addr = NULL;
    ctx->unix_sock.path = NULL;
    ctx->timeout = NULL;

    if (ctx->obuf != NULL && ctx->reader != NULL)
        return ctx;

    /* memcachedFree() copes with a partially built context. */
    memcachedFree(ctx);
    return NULL;
}

/* Tear down a context: close its descriptor (when greater than zero),
 * release the output buffer, the reader, the endpoint strings and the
 * timeout, then the context itself. Passing NULL is a no-op. */
void memcachedFree(mcContext *c) {
    if (c == NULL)
        return;

    if (c->fd > 0)
        close(c->fd);

    if (c->obuf != NULL)
        sdsfree(c->obuf);
    if (c->reader != NULL)
        memcachedReaderFree(c->reader);

    /* free(NULL) is a no-op, so unset fields need no guard. */
    free(c->tcp.host);
    free(c->tcp.source_addr);
    free(c->unix_sock.path);
    free(c->timeout);

    free(c);
}

/* Handle a read event on the descriptor: read up to 16 KiB from the socket
 * and feed the bytes to the reply parser.
 *
 * After this function returns MC_OK, memcachedGetReplyFromReader() can be
 * used to see whether a complete reply is available.
 *
 * Returns MC_ERR (with the context error set) when the context already
 * carries an error, on a read failure other than EINTR / non-blocking
 * EAGAIN, when the peer closed the connection, or when the parser rejects
 * the data. */
int memcachedBufferRead(mcContext *c) {
    char chunk[1024*16];
    int got;

    /* Return early when the context has seen an error. */
    if (c->err)
        return MC_ERR;

    got = read(c->fd,chunk,sizeof(chunk));

    if (got == 0) {
        __memcachedSetError(c,MC_ERR_EOF,"Server closed the connection");
        return MC_ERR;
    }

    if (got != -1) {
        /* Fresh data: hand it to the parser. */
        if (memcachedReaderFeed(c->reader,chunk,got) != MC_OK) {
            __memcachedSetError(c,c->reader->err,c->reader->errstr);
            return MC_ERR;
        }
        return MC_OK;
    }

    /* read() failed: transient conditions are simply retried later. */
    if ((errno == EAGAIN && !(c->flags & MC_BLOCK)) || (errno == EINTR))
        return MC_OK;

    __memcachedSetError(c,MC_ERR_IO,NULL);
    return MC_ERR;
}

/* Map a command name to its REQ_TYPE_* class.
 *
 * 'str' does not need to be NUL-terminated; exactly 'len' bytes are
 * compared, case-insensitively, against the known command names.
 * Returns -1 for a NULL/empty name or an unknown command. */
static int getRequestTypeFromString(char *str, size_t len)
{
    static const struct {
        const char *name;
        size_t namelen;
        int type;
    } commands[] = {
        { "set",     3, REQ_TYPE_STORAGE    },
        { "add",     3, REQ_TYPE_STORAGE    },
        { "cas",     3, REQ_TYPE_CAS        },
        { "get",     3, REQ_TYPE_RETRIEVAL  },
        { "gets",    4, REQ_TYPE_RETRIEVAL  },
        { "incr",    4, REQ_TYPE_ARITHMETIC },
        { "decr",    4, REQ_TYPE_ARITHMETIC },
        { "append",  6, REQ_TYPE_STORAGE    },
        { "delete",  6, REQ_TYPE_DELETE     },
        { "replace", 7, REQ_TYPE_STORAGE    },
        { "prepend", 7, REQ_TYPE_STORAGE    }
    };
    size_t i;

    if (str == NULL || len == 0)
        return -1;

    for (i = 0; i < sizeof(commands)/sizeof(commands[0]); i++) {
        /* Lengths must agree before the bytes are compared. */
        if (commands[i].namelen == len &&
            !strncasecmp(str,commands[i].name,len))
            return commands[i].type;
    }

    return -1;
}

/* Length of argument '_idx': sdslen() for sds arrays (_argtype == 0),
 * otherwise the entry of the length array, or strlen() when that array is
 * NULL. Every parameter is parenthesized so that arbitrary expressions can
 * be passed safely. */
#define ARGUMENTLEN(_argtype,_argv,_argvlen,_idx) \
    ((_argtype)==0?sdslen((_argv)[(_idx)]):((_argvlen)==NULL?strlen((_argv)[(_idx)]):(_argvlen)[(_idx)]))

/* Validate the argument count of a command and compute the exact number of
 * bytes its wire representation needs (excluding the trailing NUL).
 *
 * argtype==0 : argv is sds array
 * argtype==1 : argv is c-string array and an array with their lengths.
 * If the length array is set to NULL, strlen will be used to compute the
 * argument lengths.
 *
 * An optional "noreply" argument is accepted only when it is exactly seven
 * bytes long and matches case-insensitively.
 *
 * Returns the total length, or -1 when the command type is unknown or the
 * arguments do not fit the command.
 */
static int checkCmdValidAndGetTotalLen(int cmdtype, int argtype, int argc, char **argv, size_t *argvlen)
{
    int totlen, j;

    switch (cmdtype) {
        case REQ_TYPE_STORAGE:
            if (argc != 6 && argc != 7) {
                return -1;
            }
            if (argc == 7 && (ARGUMENTLEN(argtype,argv,argvlen,5) != 7 ||
                strncasecmp(argv[5],"noreply",7))) {
                return -1;
            }

            /* Header tokens each followed by a space, then "\r\n", the
             * data block and a final "\r\n". */
            totlen = 0;
            for (j = 0; j < argc-1; j ++) {
                totlen += ARGUMENTLEN(argtype,argv,argvlen,j) + 1;
            }
            totlen += 2 + ARGUMENTLEN(argtype,argv,argvlen,argc-1) + 2;
            break;
        case REQ_TYPE_CAS:
            if (argc != 7 && argc != 8) {
                return -1;
            }
            if (argc == 8 && (ARGUMENTLEN(argtype,argv,argvlen,6) != 7 ||
                strncasecmp(argv[6],"noreply",7))) {
                return -1;
            }

            totlen = 0;
            for (j = 0; j < argc-1; j ++) {
                totlen += ARGUMENTLEN(argtype,argv,argvlen,j) + 1;
            }
            totlen += 2 + ARGUMENTLEN(argtype,argv,argvlen,argc-1) + 2;
            break;
        case REQ_TYPE_ARITHMETIC:
            if (argc != 3) {
                return -1;
            }
            totlen = ARGUMENTLEN(argtype,argv,argvlen,0) + 1 +
                ARGUMENTLEN(argtype,argv,argvlen,1) + 1 +
                ARGUMENTLEN(argtype,argv,argvlen,2) + 2;
            break;
        case REQ_TYPE_RETRIEVAL:
            if (argc <= 1) {
                return -1;
            }

            /* Space-separated tokens terminated by "\r\n". */
            totlen = 0;
            for (j = 0; j < argc-1; j ++) {
                totlen += ARGUMENTLEN(argtype,argv,argvlen,j) + 1;
            }
            totlen += ARGUMENTLEN(argtype,argv,argvlen,argc-1) + 2;
            break;
        case REQ_TYPE_DELETE:
            if (argc != 2 && argc != 3) {
                return -1;
            }
            /* Check the length before comparing, as the storage and cas
             * branches do: a longer token such as "noreplyXYZ" must be
             * rejected and a shorter, length-delimited one must not be
             * read past its end. */
            if (argc == 3 && (ARGUMENTLEN(argtype,argv,argvlen,2) != 7 ||
                strncasecmp(argv[2],"noreply",7))) {
                return -1;
            }

            totlen = ARGUMENTLEN(argtype,argv,argvlen,0) + 1 +
                ARGUMENTLEN(argtype,argv,argvlen,1);
            if (argc == 3) {
                totlen += 1 + ARGUMENTLEN(argtype,argv,argvlen,2);
            }
            totlen += 2;
            break;
        default:
            totlen = -1;
            break;
    }

    return totlen;
}

/* Serialize a command into 'cmd', which must be large enough to hold the
 * length reported by checkCmdValidAndGetTotalLen() for the same arguments.
 * 'argtype', 'argv' and 'argvlen' have the same meaning as in that function.
 *
 * Layout: every argument but the last is followed by a single space; the
 * last argument is followed by "\r\n". For storage and cas commands the
 * last argument is the data block, so an extra "\r\n" separates it from the
 * header tokens.
 *
 * Returns the number of bytes written, or -1 for an unknown command type
 * (nothing is written in that case). */
static int genericMemcachedCommand(int cmdtype, char *cmd, int argtype, int argc, char **argv, size_t *argvlen)
{
    int has_data_block;
    int last = argc - 1;
    int off = 0; /* write offset in the final command */
    int i;
    size_t n;

    switch (cmdtype) {
        case REQ_TYPE_STORAGE:
        case REQ_TYPE_CAS:
            has_data_block = 1;
            break;
        case REQ_TYPE_ARITHMETIC:
        case REQ_TYPE_RETRIEVAL:
        case REQ_TYPE_DELETE:
            has_data_block = 0;
            break;
        default:
            return -1;
    }

    /* Leading tokens, each one terminated by a space. */
    for (i = 0; i < last; i++) {
        n = ARGUMENTLEN(argtype,argv,argvlen,i);
        memcpy(cmd+off,argv[i],n);
        off += (int)n;
        cmd[off++] = ' ';
    }

    /* The header line ends here when a data block follows. */
    if (has_data_block) {
        cmd[off++] = '\r';
        cmd[off++] = '\n';
    }

    /* Final token (or data block) and the closing line terminator. */
    n = ARGUMENTLEN(argtype,argv,argvlen,last);
    memcpy(cmd+off,argv[last],n);
    off += (int)n;
    cmd[off++] = '\r';
    cmd[off++] = '\n';

    return off;
}

/* Format a command according to the Memcached protocol from an array of
 * 'argc' sds strings.
 *
 * On success '*target' receives a malloc()ed, NUL-terminated buffer owned
 * by the caller and the command length is returned. Returns -1 for a NULL
 * target, argc < 1 or an allocation failure, and -2 when the command is
 * unknown or its arguments are invalid.
 */
int memcachedFormatCommandSdsArgv(char **target, int argc, const sds *argv) {
    char *out;
    int kind, need, written;

    /* Abort on a NULL target */
    if (target == NULL || argc < 1)
        return -1;

    kind = getRequestTypeFromString(argv[0], sdslen(argv[0]));
    if (kind < 0)
        return -2;

    need = checkCmdValidAndGetTotalLen(kind, 0, argc, argv, NULL);
    if (need < 0)
        return -2;

    /* Build the command at protocol level */
    out = malloc(need+1);
    if (out == NULL)
        return -1;

    written = genericMemcachedCommand(kind, out, 0, argc, argv, NULL);
    if (written < 0) {
        free(out);
        return -2;
    }

    assert(written == need);
    out[written] = '\0';

    *target = out;
    return need;
}

/* Build a Memcached command from a printf-like format and a va_list.
 *
 * The format is split into arguments at literal spaces. Supported
 * interpolations are %s (C string), %b (pointer followed by a size_t
 * length), %% and the printf integer/double conversions, optionally with
 * flags, width, precision and the hh/h/l/ll size modifiers. The resulting
 * arguments are handed to memcachedFormatCommandSdsArgv().
 *
 * On success '*target' receives a malloc()ed buffer owned by the caller and
 * the command length is returned. Returns -1 on a NULL target or a memory
 * error, and -2 on a format error; error codes from
 * memcachedFormatCommandSdsArgv() are passed through. */
int memcachedvFormatCommand(char **target, const char *format, va_list ap)
{
    const char *c = format;
    char *cmd = NULL; /* final command */
    sds curarg, newarg; /* current argument */
    int touched = 0; /* was the current argument touched? */
    char **curargv = NULL, **newargv = NULL;
    int argc = 0;
    int totlen;
    int error_type = 0; /* 0 = no error; -1 = memory error; -2 = format error */

    /* Abort if there is not target to set */
    if (target == NULL)
        return -1;

    /* Build the command string accordingly to protocol */
    curarg = sdsempty();
    if (curarg == NULL)
        return -1;

    while(*c != '\0') {
        if (*c != '%' || c[1] == '\0') {
            if (*c == ' ') {
                if (touched) {
                    newargv = realloc(curargv,sizeof(char*)*(argc+1));
                    if (newargv == NULL) goto memory_err;
                    curargv = newargv;
                    curargv[argc++] = curarg;

                    /* curarg is put in argv so it can be overwritten. */
                    curarg = sdsempty();
                    if (curarg == NULL) goto memory_err;
                    touched = 0;
                }
            } else {
                newarg = sdscatlen(curarg,c,1);
                if (newarg == NULL) goto memory_err;
                curarg = newarg;
                touched = 1;
            }
        } else {
            char *arg;
            size_t size;

            /* Set newarg so it can be checked even if it is not touched. */
            newarg = curarg;

            switch(c[1]) {
            case 's':
                arg = va_arg(ap,char*);
                size = strlen(arg);
                if (size > 0)
                    newarg = sdscatlen(curarg,arg,size);
                break;
            case 'b':
                arg = va_arg(ap,char*);
                size = va_arg(ap,size_t);
                if (size > 0)
                    newarg = sdscatlen(curarg,arg,size);
                break;
            case '%':
                newarg = sdscat(curarg,"%");
                break;
            default:
                /* Try to detect printf format */
                {
                    static const char intfmts[] = "diouxX";
                    static const char flags[] = "#0-+ ";
                    char _format[16];
                    const char *_p = c+1;
                    size_t _l = 0;
                    va_list _cpy;

                    /* Flags */
                    while (*_p != '\0' && strchr(flags,*_p) != NULL) _p++;

                    /* Field width (cast: isdigit() requires a value
                     * representable as unsigned char) */
                    while (*_p != '\0' && isdigit((unsigned char)*_p)) _p++;

                    /* Precision */
                    if (*_p == '.') {
                        _p++;
                        while (*_p != '\0' && isdigit((unsigned char)*_p)) _p++;
                    }

                    /* Copy va_list before consuming with va_arg */
                    va_copy(_cpy,ap);

                    /* Integer conversion (without modifiers). The NUL check
                     * matters: strchr() also matches the terminator, which
                     * would accept a truncated specifier such as "%5" and
                     * move the cursor past the end of the format. */
                    if (*_p != '\0' && strchr(intfmts,*_p) != NULL) {
                        va_arg(ap,int);
                        goto fmt_valid;
                    }

                    /* Double conversion (without modifiers) */
                    if (*_p != '\0' && strchr("eEfFgGaA",*_p) != NULL) {
                        va_arg(ap,double);
                        goto fmt_valid;
                    }

                    /* Size: char */
                    if (_p[0] == 'h' && _p[1] == 'h') {
                        _p += 2;
                        if (*_p != '\0' && strchr(intfmts,*_p) != NULL) {
                            va_arg(ap,int); /* char gets promoted to int */
                            goto fmt_valid;
                        }
                        goto fmt_invalid;
                    }

                    /* Size: short */
                    if (_p[0] == 'h') {
                        _p += 1;
                        if (*_p != '\0' && strchr(intfmts,*_p) != NULL) {
                            va_arg(ap,int); /* short gets promoted to int */
                            goto fmt_valid;
                        }
                        goto fmt_invalid;
                    }

                    /* Size: long long */
                    if (_p[0] == 'l' && _p[1] == 'l') {
                        _p += 2;
                        if (*_p != '\0' && strchr(intfmts,*_p) != NULL) {
                            va_arg(ap,long long);
                            goto fmt_valid;
                        }
                        goto fmt_invalid;
                    }

                    /* Size: long */
                    if (_p[0] == 'l') {
                        _p += 1;
                        if (*_p != '\0' && strchr(intfmts,*_p) != NULL) {
                            va_arg(ap,long);
                            goto fmt_valid;
                        }
                        goto fmt_invalid;
                    }

                fmt_invalid:
                    va_end(_cpy);
                    goto format_err;

                fmt_valid:
                    _l = (_p+1)-c;
                    if (_l < sizeof(_format)-2) {
                        memcpy(_format,c,_l);
                        _format[_l] = '\0';
                        newarg = sdscatvprintf(curarg,_format,_cpy);

                        /* Update current position (note: outer blocks
                         * increment c twice so compensate here) */
                        c = _p-1;
                    }

                    va_end(_cpy);
                    break;
                }
            }

            if (newarg == NULL) goto memory_err;
            curarg = newarg;

            touched = 1;
            c++;
        }
        c++;
    }

    /* Add the last argument if needed */
    if (touched) {
        newargv = realloc(curargv,sizeof(char*)*(argc+1));
        if (newargv == NULL) goto memory_err;
        curargv = newargv;
        curargv[argc++] = curarg;
    } else {
        sdsfree(curarg);
    }

    /* Clear curarg because it was put in curargv or was free'd. */
    curarg = NULL;

    totlen = memcachedFormatCommandSdsArgv(&cmd, argc,curargv);
    if (totlen < 0) {
        error_type = totlen;
        goto cleanup;
    }

    /* The arguments were copied into cmd, so the temporary sds strings must
     * be released together with the vector that holds them. */
    while(argc--)
        sdsfree(curargv[argc]);
    free(curargv);
    *target = cmd;
    return totlen;

format_err:
    error_type = -2;
    goto cleanup;

memory_err:
    error_type = -1;
    goto cleanup;

cleanup:
    if (curargv) {
        while(argc--)
            sdsfree(curargv[argc]);
        free(curargv);
    }

    sdsfree(curarg);

    /* No need to check cmd since it is the last statement that can fail,
     * but do it anyway to be as defensive as possible. */
    if (cmd != NULL)
        free(cmd);

    return error_type;
}

/* Format a command according to the Memcached protocol. This function
 * takes a format similar to printf:
 *
 * %s represents a C null terminated string you want to interpolate
 * %b represents a binary safe string
 *
 * When using %b you need to provide both the pointer to the string
 * and the length in bytes as a size_t. Integer and floating point printf
 * conversions (with the hh, h, l and ll size modifiers) are accepted as
 * well. Examples:
 *
 * len = memcachedFormatCommand(target, "get %s", mykey);
 * len = memcachedFormatCommand(target, "set %s %d %lld %d %b", mykey, myflags, myexptime, (int)myvallen, myval, myvallen);
 *
 * Returns the length of the formatted command, or -1 on any failure.
 */
int memcachedFormatCommand(char **target, const char *format, ...) {
    va_list args;
    int rc;

    va_start(args,format);
    rc = memcachedvFormatCommand(target,format,args);
    va_end(args);

    /* The API says "-1" means bad result, but the va_list variant may also
     * return "-2"; collapse every failure into -1. */
    return rc < 0 ? -1 : rc;
}

/* Format a command according to the Memcached protocol. This function takes
 * the number of arguments, an array with arguments and an array with their
 * lengths. If the latter is set to NULL, strlen will be used to compute the
 * argument lengths.
 *
 * On success '*target' receives a malloc()ed, NUL-terminated buffer owned
 * by the caller and the command length is returned. Returns -1 for a NULL
 * target, argc < 1 or an allocation failure, and -2 when the command is
 * unknown or its arguments are invalid.
 */
int memcachedFormatCommandArgv(char **target, int argc, const char **argv, const size_t *argvlen) {
    char *out;
    int kind, need, written;

    /* Abort on a NULL target */
    if (target == NULL || argc < 1)
        return -1;

    kind = getRequestTypeFromString(argv[0], argvlen==NULL?strlen(argv[0]):argvlen[0]);
    if (kind < 0)
        return -2;

    need = checkCmdValidAndGetTotalLen(kind, 1, argc, argv, argvlen);
    if (need < 0)
        return -2;

    /* Build the command at protocol level */
    out = malloc(need+1);
    if (out == NULL)
        return -1;

    written = genericMemcachedCommand(kind, out, 1, argc, argv, argvlen);
    if (written < 0) {
        free(out);
        return -2;
    }

    assert(written == need);
    out[written] = '\0';

    *target = out;
    return need;
}


================================================
FILE: dep/himemcached-0.1.0/himemcached.h
================================================
#ifndef _HIMEMCACHED_H_
#define _HIMEMCACHED_H_

#include "himcread.h"
#include "himcdep/sds.h"

#define HIMC_MAJOR 0
#define HIMC_MINOR 13
#define HIMC_PATCH 1

/* Connection type can be blocking or non-blocking and is set in the
 * least significant bit of the flags field in mcContext. */
#define MC_BLOCK 0x1

/* Connection may be disconnected before being free'd. The second bit
 * in the flags field is set when the context is connected. */
#define MC_CONNECTED 0x2

/* The async API might try to disconnect cleanly and flush the output
 * buffer and read all subsequent replies before disconnecting.
 * This flag means no new commands can come in and the connection
 * should be terminated once all replies have been read. */
#define MC_DISCONNECTING 0x4

/* Flag specific to the async API which means that the context should be clean
 * up as soon as possible. */
#define MC_FREEING 0x8

/* Flag that is set when an async callback is executed. */
#define MC_IN_CALLBACK 0x10

/* Flag that is set when the async context has one or more subscriptions. */
#define MC_SUBSCRIBED 0x20

/* Flag that is set when monitor mode is active */
#define MC_MONITORING 0x40

/* Flag that is set when we should set SO_REUSEADDR before calling bind() */
#define MC_REUSEADDR 0x80

#define MC_KEEPALIVE_INTERVAL 15 /* seconds */

/* number of times we retry to connect in the case of EADDRNOTAVAIL and
 * SO_REUSEADDR is being used. */
#define MC_CONNECT_RETRIES  10

/* This is the reply object returned by memcachedCommand().
 * Which fields are meaningful depends on 'type'; objects are released with
 * freeMcReplyObject(). */
typedef struct mcReply {
    int type; /* MC_REPLY_* */
    long long integer; /* The integer when type is MC_REPLY_INTEGER */
    int keylen; /* Length of key */
    char *key;  /* Key string (NULL when the reply carries no key) */
    int len; /* Length of string */
    char *str; /* Used for MC_REPLY_STRING, MC_REPLY_STATUS and MC_REPLY_ERROR */
    int flags; /* Flags value stored with a string-like reply */
    long long version; /* Version value stored with a string-like reply */
    size_t elements; /* number of elements, for MC_REPLY_ARRAY */
    struct mcReply **element; /* elements vector for MC_REPLY_ARRAY */
} mcReply;

mcReader *memcachedReaderCreate(void);

/* Function to free the reply objects himemcached returns by default. */
void freeMcReplyObject(void *reply);

/* Kind of endpoint a context refers to; stored in
 * mcContext.connection_type. */
enum mcConnectionType {
    MC_CONN_TCP,    /* see the 'tcp' member of mcContext */
    MC_CONN_UNIX,   /* see the 'unix_sock' member of mcContext */
};

/* Context for a connection to Memcached.
 * Created by memcachedContextInit() and destroyed by memcachedFree(), which
 * also releases the buffers and strings referenced below. */
typedef struct mcContext {
    int err; /* Error flags, 0 when there is no error */
    char errstr[128]; /* String representation of error when applicable */
    int fd; /* Socket descriptor used for read()/write() */
    int flags; /* Bitmask of the MC_* flags above (e.g. MC_BLOCK) */
    char *obuf; /* Write buffer */
    mcReader *reader; /* Protocol reader */

    enum mcConnectionType connection_type;
    struct timeval *timeout; /* Freed by memcachedFree() when set */

    /* Endpoint description for MC_CONN_TCP. */
    struct {
        char *host;
        char *source_addr;
        int port;
    } tcp;

    /* Endpoint description for MC_CONN_UNIX. */
    struct {
        char *path;
    } unix_sock;
} mcContext;

int memcachedBufferWrite(mcContext *c, int *done);
int memcachedBufferRead(mcContext *c);

int memcachedGetReplyFromReader(mcContext *c, void **reply);
int memcachedGetReply(mcContext *c, void **reply);

mcContext *memcachedContextInit(void);
void memcachedFree(mcContext *c) ;

int memcachedFormatCommandSdsArgv(char **target, int argc, const sds *argv);
int memcachedvFormatCommand(char **target, const char *format, va_list ap);
int memcachedFormatCommand(char **target, const char *format, ...);
int memcachedFormatCommandArgv(char **target, int argc, const char **argv, const size_t *argvlen);

#endif /* _HIMEMCACHED_H_ */


================================================
FILE: dep/hiredis-0.13.3/.gitignore
================================================


================================================
FILE: dep/jemalloc-4.2.0/.gitignore
================================================


================================================
FILE: dep/sds/Makefile.am
================================================
MAINTAINERCLEANFILES = Makefile.in

AM_CPPFLAGS =
if !OS_SOLARIS
AM_CPPFLAGS += -D_GNU_SOURCE
endif
AM_CPPFLAGS += -I $(top_srcdir)/dep/util
AM_CPPFLAGS += -I $(top_srcdir)/dep/jemalloc-4.2.0/include
AM_CPPFLAGS += -I $(top_srcdir)/dep/dmalloc

AM_CFLAGS = -Wall -Wshadow
AM_CFLAGS += -Wno-unused-parameter -Wno-unused-value

noinst_LIBRARIES = libsds.a

noinst_HEADERS = sds.h sdsalloc.h

libsds_a_SOURCES =      \
    sdsalloc.h          \
	sds.c sds.h

================================================
FILE: dep/sds/sds.c
================================================
/* SDSLib 2.0 -- A C dynamic strings library
 *
 * Copyright (c) 2006-2015, Salvatore Sanfilippo <antirez at gmail dot com>
 * Copyright (c) 2015, Oran Agra
 * Copyright (c) 2015, Redis Labs, Inc
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *   * Redistributions of source code must retain the above copyright notice,
 *     this list of conditions and the following disclaimer.
 *   * Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *   * Neither the name of Redis nor the names of its contributors may be used
 *     to endorse or promote products derived from this software without
 *     specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <ctype.h>
#include <assert.h>

#include <sds.h>
#include <sdsalloc.h>

/* Size in bytes of the header structure that matches the SDS type encoded
 * in the low bits of 'type'. Returns 0 for an unrecognized type. */
static inline int sdsHdrSize(char type) {
    const int kind = type & SDS_TYPE_MASK;

    if (kind == SDS_TYPE_5)
        return sizeof(struct sdshdr5);
    if (kind == SDS_TYPE_8)
        return sizeof(struct sdshdr8);
    if (kind == SDS_TYPE_16)
        return sizeof(struct sdshdr16);
    if (kind == SDS_TYPE_32)
        return sizeof(struct sdshdr32);
    if (kind == SDS_TYPE_64)
        return sizeof(struct sdshdr64);

    return 0;
}

/* Select the smallest sds header type able to describe a string of
 * 'string_size' bytes. The thresholds are checked in increasing order. */
static inline char sdsReqType(size_t string_size) {
    char type;

    if (string_size < 32) {
        type = SDS_TYPE_5;
    } else if (string_size < 0xff) {
        type = SDS_TYPE_8;
    } else if (string_size < 0xffff) {
        type = SDS_TYPE_16;
    } else if (string_size < 0xffffffff) {
        type = SDS_TYPE_32;
    } else {
        type = SDS_TYPE_64;
    }
    return type;
}

/* Create a new sds string with the content specified by the 'init' pointer
 * and 'initlen'.
 * If NULL is used for 'init' the string is initialized with zero bytes.
 *
 * The string is always null-terminated (all the sds strings are, always) so
 * even if you create an sds string with:
 *
 * mystring = sdsnewlen("abc",3);
 *
 * You can print the string with printf() as there is an implicit \0 at the
 * end of the string. However the string is binary safe and can contain
 * \0 characters in the middle, as the length is stored in the sds header.
 *
 * Returns NULL if the allocation fails. */
sds sdsnewlen(const void *init, size_t initlen) {
    void *sh;
    sds s;
    char type = sdsReqType(initlen);
    /* Empty strings are usually created in order to append. Use type 8
     * since type 5 is not good at this. */
    if (type == SDS_TYPE_5 && initlen == 0) type = SDS_TYPE_8;
    int hdrlen = sdsHdrSize(type);
    unsigned char *fp; /* flags pointer. */

    sh = s_malloc(hdrlen+initlen+1);
    /* Check the allocation BEFORE touching the buffer: zeroing it first
     * would dereference NULL when the allocator fails. */
    if (sh == NULL) return NULL;
    if (!init)
        memset(sh, 0, hdrlen+initlen+1);
    s = (char*)sh+hdrlen;
    fp = ((unsigned char*)s)-1;
    switch(type) {
        case SDS_TYPE_5: {
            /* Type 5 has no header struct: the length lives in the upper
             * bits of the flags byte itself. */
            *fp = type | (initlen << SDS_TYPE_BITS);
            break;
        }
        case SDS_TYPE_8: {
            SDS_HDR_VAR(8,s);
            sh->len = initlen;
            sh->alloc = initlen;
            *fp = type;
            break;
        }
        case SDS_TYPE_16: {
            SDS_HDR_VAR(16,s);
            sh->len = initlen;
            sh->alloc = initlen;
            *fp = type;
            break;
        }
        case SDS_TYPE_32: {
            SDS_HDR_VAR(32,s);
            sh->len = initlen;
            sh->alloc = initlen;
            *fp = type;
            break;
        }
        case SDS_TYPE_64: {
            SDS_HDR_VAR(64,s);
            sh->len = initlen;
            sh->alloc = initlen;
            *fp = type;
            break;
        }
    }
    if (initlen && init)
        memcpy(s, init, initlen);
    s[initlen] = '\0';
    return s;
}

/* Build a zero-length sds string. The result still carries the implicit
 * null terminator every sds string has. */
sds sdsempty(void) {
    sds empty = sdsnewlen("",0);

    return empty;
}

/* Build an sds string from a null terminated C string. A NULL 'init' is
 * forwarded to sdsnewlen() with a length of zero. */
sds sdsnew(const char *init) {
    if (init == NULL) return sdsnewlen(init, 0);
    return sdsnewlen(init, strlen(init));
}

/* Return a new sds string holding a copy of the sdslen(s) bytes of 's'. */
sds sdsdup(const sds s) {
    size_t srclen = sdslen(s);

    return sdsnewlen(s, srclen);
}

/* Release an sds string. Passing NULL is allowed and does nothing.
 *
 * The allocation starts at the header, which sits just before 's'; its size
 * is derived from the flags byte stored at s[-1]. */
void sdsfree(sds s) {
    if (s != NULL) {
        s_free((char*)s-sdsHdrSize(s[-1]));
    }
}

/* Set the sds string length to the length as obtained with strlen(), so
 * considering as content only up to the first null term character.
 *
 * This function is useful when the sds string is hacked manually in some
 * way, like in the following example:
 *
 * s = sdsnew("foobar");
 * s[2] = '\0';
 * sdsupdatelen(s);
 * printf("%d\n", sdslen(s));
 *
 * The output will be "2", but if we comment out the call to sdsupdatelen()
 * the output will be "6" as the string was modified but the logical length
 * remains 6 bytes. */
void sdsupdatelen(sds s) {
    /* Keep the strlen() result in a size_t: an int would truncate (or turn
     * negative) for strings longer than INT_MAX bytes. */
    size_t reallen = strlen(s);
    sdssetlen(s, reallen);
}

/* Empty an sds string in place: the first byte becomes the terminator and
 * the recorded length is set to zero. Nothing is reallocated here, so the
 * buffer the string already owns is left as it is. */
void sdsclear(sds s) {
    s[0] = '\0';
    sdssetlen(s, 0);
}

/* Guarantee that at least 'addlen' bytes (plus one for the null term) can be
 * written after the current end of 's'.
 *
 * The length reported by sdslen() is untouched; only the spare capacity
 * grows. When a reallocation is needed the requested total is doubled while
 * it is below SDS_MAX_PREALLOC, and increased by SDS_MAX_PREALLOC otherwise.
 *
 * Returns the (possibly moved) string, or NULL if the allocation fails. */
sds sdsMakeRoomFor(sds s, size_t addlen) {
    char curtype = s[-1] & SDS_TYPE_MASK;
    char newtype;
    size_t curlen, wanted;
    int newhdr;
    void *oldbase, *newbase;

    /* Nothing to do when the spare room is already large enough. */
    if (sdsavail(s) >= addlen) return s;

    curlen = sdslen(s);
    oldbase = (char*)s-sdsHdrSize(curtype);

    wanted = curlen+addlen;
    if (wanted < SDS_MAX_PREALLOC) {
        wanted *= 2;
    } else {
        wanted += SDS_MAX_PREALLOC;
    }

    /* Type 5 cannot record unused capacity, which would force a call to
     * this function on every append, so promote it to type 8. */
    newtype = sdsReqType(wanted);
    if (newtype == SDS_TYPE_5) newtype = SDS_TYPE_8;
    newhdr = sdsHdrSize(newtype);

    if (newtype == curtype) {
        /* Same header layout: the block can simply be resized. */
        newbase = s_realloc(oldbase, newhdr+wanted+1);
        if (newbase == NULL) return NULL;
        s = (char*)newbase+newhdr;
    } else {
        /* The header size changes, so the payload has to be copied to a
         * different offset inside a fresh allocation. */
        newbase = s_malloc(newhdr+wanted+1);
        if (newbase == NULL) return NULL;
        memcpy((char*)newbase+newhdr, s, curlen+1);
        s_free(oldbase);
        s = (char*)newbase+newhdr;
        s[-1] = newtype;
        sdssetlen(s, curlen);
    }
    sdssetalloc(s, wanted);
    return s;
}

/* Shrink the allocation of 's' so that no spare room is left after the
 * string. The content is preserved, but the next append will have to
 * reallocate.
 *
 * The pointer passed in must be considered invalid after the call: use the
 * returned one instead. NULL is returned if the allocation fails. */
sds sdsRemoveFreeSpace(sds s) {
    char curtype = s[-1] & SDS_TYPE_MASK;
    size_t used = sdslen(s);
    void *oldbase = (char*)s-sdsHdrSize(curtype);
    char fit = sdsReqType(used);
    int fithdr = sdsHdrSize(fit);
    void *newbase;

    if (fit == curtype) {
        /* Header layout unchanged: resize the block in place. */
        newbase = s_realloc(oldbase, fithdr+used+1);
        if (newbase == NULL) return NULL;
        s = (char*)newbase+fithdr;
    } else {
        /* A different header is required: copy into a new allocation. */
        newbase = s_malloc(fithdr+used+1);
        if (newbase == NULL) return NULL;
        memcpy((char*)newbase+fithdr, s, used+1);
        s_free(oldbase);
        s = (char*)newbase+fithdr;
        s[-1] = fit;
        sdssetlen(s, used);
    }
    sdssetalloc(s, used);
    return s;
}

/* Compute the total number of bytes allocated for the given sds string:
 *
 * 1) the sds header stored before the pointer,
 * 2) the sdsalloc() bytes of buffer (string plus any free space),
 * 3) the implicit null term.
 */
size_t sdsAllocSize(sds s) {
    size_t header = sdsHdrSize(s[-1]);

    return header+sdsalloc(s)+1;
}

/* Return the address where the sds allocation really starts, i.e. the
 * beginning of the header that precedes the string buffer 's' points to. */
void *sdsAllocPtr(sds s) {
    int header = sdsHdrSize(s[-1]);

    return (void*) (s-header);
}

/* Increment the sds length and decrements the left free space at the
 * end of the string according to 'incr'. Also set the null term
 * in the new end of the string.
 *
 * This function is used in order to fix the string length after the
 * user calls sdsMakeRoomFor(), writes something after the end of
 * the current string, and finally needs to set the new length.
 *
 * Note: it is possible to use a negative increment in order to
 * right-trim the string. An increment of zero is a no-op for every
 * header type.
 *
 * The requested change is validated with assert(): growing beyond the
 * available space or trimming more than the current length aborts.
 *
 * Usage example:
 *
 * Using sdsIncrLen() and sdsMakeRoomFor() it is possible to mount the
 * following schema, to cat bytes coming from the kernel to the end of an
 * sds string without copying into an intermediate buffer:
 *
 * oldlen = sdslen(s);
 * s = sdsMakeRoomFor(s, BUFFER_SIZE);
 * nread = read(fd, s+oldlen, BUFFER_SIZE);
 * ... check for nread <= 0 and handle it ...
 * sdsIncrLen(s, nread);
 */
void sdsIncrLen(sds s, int incr) {
    unsigned char flags = s[-1];
    size_t len;
    switch(flags&SDS_TYPE_MASK) {
        case SDS_TYPE_5: {
            unsigned char *fp = ((unsigned char*)s)-1;
            unsigned char oldlen = SDS_TYPE_5_LEN(flags);
            /* Accept incr == 0 like the other header types do; the previous
             * 'incr > 0' test made a zero increment abort on short strings. */
            assert((incr >= 0 && oldlen+incr < 32) || (incr < 0 && oldlen >= (unsigned int)(-incr)));
            *fp = SDS_TYPE_5 | ((oldlen+incr) << SDS_TYPE_BITS);
            len = oldlen+incr;
            break;
        }
        case SDS_TYPE_8: {
            SDS_HDR_VAR(8,s);
            assert((incr >= 0 && sh->alloc-sh->len >= incr) || (incr < 0 && sh->len >= (unsigned int)(-incr)));
            len = (sh->len += incr);
            break;
        }
        case SDS_TYPE_16: {
            SDS_HDR_VAR(16,s);
            assert((incr >= 0 && sh->alloc-sh->len >= incr) || (incr < 0 && sh->len >= (unsigned int)(-incr)));
            len = (sh->len += incr);
            break;
        }
        case SDS_TYPE_32: {
            SDS_HDR_VAR(32,s);
            assert((incr >= 0 && sh->alloc-sh->len >= (unsigned int)incr) || (incr < 0 && sh->len >= (unsigned int)(-incr)));
            len = (sh->len += incr);
            break;
        }
        case SDS_TYPE_64: {
            SDS_HDR_VAR(64,s);
            assert((incr >= 0 && sh->alloc-sh->len >= (uint64_t)incr) || (incr < 0 && sh->len >= (uint64_t)(-incr)));
            len = (sh->len += incr);
            break;
        }
        default: len = 0; /* Just to avoid compilation warnings. */
    }
    s[len] = '\0';
}

/* Extend 's' so that its length becomes 'len', filling the newly added
 * bytes with zeroes.
 *
 * When 'len' is not larger than the current length the string is returned
 * untouched. NULL is returned if making room fails. */
sds sdsgrowzero(sds s, size_t len) {
    size_t oldlen = sdslen(s);
    size_t extra;

    if (oldlen >= len) return s;

    extra = len-oldlen;
    s = sdsMakeRoomFor(s,extra);
    if (s == NULL) return NULL;

    /* Zero the added region; the extra byte is the trailing \0. */
    memset(s+oldlen,0,extra+1);
    sdssetlen(s, len);
    return s;
}

/* Concatenate the 'len' bytes found at 't' (binary safe) to the sds string
 * 's'.
 *
 * The pointer passed as 's' must not be used after the call: replace every
 * reference with the returned pointer. NULL is returned if making room
 * fails. */
sds sdscatlen(sds s, const void *t, size_t len) {
    size_t oldlen = sdslen(s);
    size_t total = oldlen+len;

    s = sdsMakeRoomFor(s,len);
    if (!s) return NULL;

    memcpy(s+oldlen, t, len);
    sdssetlen(s, total);
    s[total] = '\0';
    return s;
}

/* Concatenate the null terminated C string 't' to the sds string 's'.
 *
 * The pointer passed as 's' must not be used after the call: replace every
 * reference with the returned pointer. */
sds sdscat(sds s, const char *t) {
    size_t tlen = strlen(t);

    return sdscatlen(s, t, tlen);
}

/* Concatenate the sds string 't' to the sds string 's'.
 *
 * The pointer passed as 's' must not be used after the call: replace every
 * reference with the returned pointer. */
sds sdscatsds(sds s, const sds t) {
    size_t tlen = sdslen(t);

    return sdscatlen(s, t, tlen);
}

/* Overwrite the content of 's' with the 'len' bytes (binary safe) found at
 * 't'. The buffer is enlarged first when its capacity is below 'len'.
 *
 * Returns the (possibly moved) string, or NULL if making room fails. */
sds sdscpylen(sds s, const char *t, size_t len) {
    if (len > sdsalloc(s)) {
        size_t missing = len-sdslen(s);

        s = sdsMakeRoomFor(s,missing);
        if (s == NULL) return NULL;
    }
    memcpy(s, t, len);
    s[len] = '\0';
    sdssetlen(s, len);
    return s;
}

/* Same as sdscpylen(), for a null terminated 't' whose length is computed
 * with strlen(). */
sds sdscpy(sds s, const char *t) {
    size_t tlen = strlen(t);

    return sdscpylen(s, t, tlen);
}

/* Helper for sdscatlonglong() doing the actual number -> string
 * conversion. 's' must point to a string with room for at least
 * SDS_LLSTR_SIZE bytes.
 *
 * The function returns the length of the null-terminated string
 * representation stored at 's'. */
#define SDS_LLSTR_SIZE 21
int sdsll2str(char *s, long long value) {
    char *p, aux;
    unsigned long long v;
    size_t l;

    /* Take the absolute value in unsigned arithmetic: negating LLONG_MIN
     * as a signed long long overflows, which is undefined behavior, while
     * unsigned negation is well defined and yields the right magnitude. */
    v = (unsigned long long)value;
    if (value < 0) v = 0ULL - v;

    /* Generate the string representation, this method produces
     * a reversed string. */
    p = s;
    do {
        *p++ = '0'+(v%10);
        v /= 10;
    } while(v);
    if (value < 0) *p++ = '-';

    /* Compute length and add null term. */
    l = p-s;
    *p = '\0';

    /* Reverse the string. */
    p--;
    while(s < p) {
        aux = *s;
        *s = *p;
        *p = aux;
        s++;
        p--;
    }
    return l;
}

/* Unsigned counterpart of sdsll2str(): write the decimal representation of
 * 'v' at 's' as a null terminated string and return its length. */
int sdsull2str(char *s, unsigned long long v) {
    char *head = s, *tail = s;
    size_t written;

    /* Emit the digits starting from the least significant one, so the
     * buffer holds the number backwards at this point. */
    do {
        *tail = '0'+(v%10);
        tail++;
        v /= 10;
    } while(v != 0);

    written = tail-s;
    *tail = '\0';

    /* Swap the two ends moving inwards to restore the natural order. */
    for (tail--; head < tail; head++, tail--) {
        char tmp = *head;

        *head = *tail;
        *tail = tmp;
    }
    return written;
}

/* Build an sds string holding the decimal representation of 'value'.
 * It is a much faster alternative to:
 *
 * sdscatprintf(sdsempty(),"%lld\n", value);
 */
sds sdsfromlonglong(long long value) {
    char digits[SDS_LLSTR_SIZE];
    int ndigits;

    ndigits = sdsll2str(digits,value);
    return sdsnewlen(digits,ndigits);
}

/* va_list flavour of sdscatprintf(): format according to 'fmt' and 'ap'
 * and append the result to 's'.
 *
 * Returns the new string, or NULL when a temporary buffer cannot be
 * allocated or the final concatenation fails. */
sds sdscatvprintf(sds s, const char *fmt, va_list ap) {
    char stackbuf[1024];
    char *out = stackbuf;
    size_t cap = strlen(fmt)*2;
    va_list args;
    sds result;

    /* Start from the stack buffer for speed; go to the heap only when the
     * initial size guess does not fit in it. */
    if (cap <= sizeof(stackbuf)) {
        cap = sizeof(stackbuf);
    } else {
        out = s_malloc(cap);
        if (out == NULL) return NULL;
    }

    /* The byte before the last one acts as a sentinel: if vsnprintf()
     * overwrites it the output may have been truncated, so retry with a
     * buffer twice as large. */
    for (;;) {
        out[cap-2] = '\0';
        va_copy(args,ap);
        vsnprintf(out, cap, fmt, args);
        va_end(args);
        if (out[cap-2] == '\0') break;

        if (out != stackbuf) s_free(out);
        cap *= 2;
        out = s_malloc(cap);
        if (out == NULL) return NULL;
    }

    /* Append the formatted text to the sds string and release the heap
     * buffer, if one was used. */
    result = sdscat(s, out);
    if (out != stackbuf) s_free(out);
    return result;
}

/* Append to the sds string 's' the text produced by a printf-alike format
 * string and its arguments.
 *
 * The pointer passed as 's' must not be used after the call: replace every
 * reference with the returned pointer.
 *
 * Example:
 *
 * s = sdsnew("Sum is: ");
 * s = sdscatprintf(s,"%d+%d = %d",a,b,a+b).
 *
 * To build a string from scratch with a printf-alike format, pass
 * sdsempty() as the target string:
 *
 * s = sdscatprintf(sdsempty(), "... your format ...", args);
 */
sds sdscatprintf(sds s, const char *fmt, ...) {
    va_list args;
    sds result;

    va_start(args, fmt);
    result = sdscatvprintf(s,fmt,args);
    va_end(args);
    return result;
}

/* This function is similar to sdscatprintf, but much faster as it does
 * not rely on sprintf() family functions implemented by the libc that
 * are often very slow. Moreover directly handling the sds string as
 * new data is concatenated provides a performance improvement.
 *
 * However this function only handles an incompatible subset of printf-alike
 * format specifiers:
 *
 * %s - C String
 * %S - SDS string
 * %i - signed int
 * %I - 64 bit signed integer (long long, int64_t)
 * %u - unsigned int
 * %U - 64 bit unsigned integer (unsigned long long, uint64_t)
 * %% - Verbatim "%" character.
 *
 * A '%' followed by any other character emits that character verbatim.
 * A lone '%' at the very end of the format is ignored.
 *
 * Returns the new string, or NULL if the buffer cannot be enlarged.
 */
sds sdscatfmt(sds s, char const *fmt, ...) {
    const char *f = fmt;  /* Next format specifier byte to process. */
    size_t i = sdslen(s); /* Position of the next byte to write to dest str. */
    va_list ap;

    va_start(ap,fmt);
    while(*f) {
        char next, *str;
        size_t l;
        long long num;
        unsigned long long unum;

        /* Make sure there is always space for at least 1 char. */
        if (sdsavail(s)==0) {
            s = sdsMakeRoomFor(s,1);
            if (s == NULL) goto oom;
        }

        switch(*f) {
        case '%':
            next = *(f+1);
            /* A trailing '%' has nothing after it: stop here, otherwise
             * the two increments of 'f' would step over the terminator
             * and the loop would read past the end of the format. */
            if (next == '\0') break;
            f++;
            switch(next) {
            case 's':
            case 'S':
                str = va_arg(ap,char*);
                l = (next == 's') ? strlen(str) : sdslen(str);
                if (sdsavail(s) < l) {
                    s = sdsMakeRoomFor(s,l);
                    if (s == NULL) goto oom;
                }
                memcpy(s+i,str,l);
                sdsinclen(s,l);
                i += l;
                break;
            case 'i':
            case 'I':
                if (next == 'i')
                    num = va_arg(ap,int);
                else
                    num = va_arg(ap,long long);
                {
                    char buf[SDS_LLSTR_SIZE];
                    l = sdsll2str(buf,num);
                    if (sdsavail(s) < l) {
                        s = sdsMakeRoomFor(s,l);
                        if (s == NULL) goto oom;
                    }
                    memcpy(s+i,buf,l);
                    sdsinclen(s,l);
                    i += l;
                }
                break;
            case 'u':
            case 'U':
                if (next == 'u')
                    unum = va_arg(ap,unsigned int);
                else
                    unum = va_arg(ap,unsigned long long);
                {
                    char buf[SDS_LLSTR_SIZE];
                    l = sdsull2str(buf,unum);
                    if (sdsavail(s) < l) {
                        s = sdsMakeRoomFor(s,l);
                        if (s == NULL) goto oom;
                    }
                    memcpy(s+i,buf,l);
                    sdsinclen(s,l);
                    i += l;
                }
                break;
            default: /* Handle %% and generally %<unknown>. */
                s[i++] = next;
                sdsinclen(s,1);
                break;
            }
            break;
        default:
            s[i++] = *f;
            sdsinclen(s,1);
            break;
        }
        f++;
    }
    va_end(ap);

    /* Add null-term */
    s[i] = '\0';
    return s;

oom:
    va_end(ap);
    return NULL;
}

/* Strip from both ends of 's' every contiguous character that appears in
 * 'cset', a null terminated C string.
 *
 * The string is modified in place and the same pointer is returned.
 *
 * Example:
 *
 * s = sdsnew("AA...AA.a.aa.aHelloWorld     :::");
 * s = sdstrim(s,"Aa. :");
 * printf("%s\n", s);
 *
 * Output will be just "HelloWorld".
 */
sds sdstrim(sds s, const char *cset) {
    char *last = s+sdslen(s)-1;
    char *left = s, *right = last;
    size_t keep;

    /* Advance past the leading characters to drop, then walk back over
     * the trailing ones. */
    while(left <= last && strchr(cset, *left)) left++;
    while(right > left && strchr(cset, *right)) right--;

    if (left > right) {
        keep = 0;
    } else {
        keep = (right-left)+1;
    }
    if (left != s) memmove(s, left, keep);
    s[keep] = '\0';
    sdssetlen(s,keep);
    return s;
}

/* Reduce the string, in place, to the substring delimited by the 'start'
 * and 'end' indexes (both inclusive).
 *
 * Negative indexes count from the end: -1 is the last character, -2 the
 * penultimate one, and so forth. Indexes falling outside the string are
 * clamped, and an empty range produces an empty string.
 *
 * Example:
 *
 * s = sdsnew("Hello World");
 * sdsrange(s,1,-1); => "ello World"
 */
void sdsrange(sds s, int start, int end) {
    size_t len = sdslen(s);
    size_t newlen;

    if (len == 0) return;

    /* Translate negative indexes into offsets from the beginning. */
    if (start < 0) {
        start = len+start;
        if (start < 0) start = 0;
    }
    if (end < 0) {
        end = len+end;
        if (end < 0) end = 0;
    }

    if (start > end) {
        /* Empty range. */
        newlen = 0;
        start = 0;
    } else if (start >= (signed)len) {
        /* The range begins after the end of the string. */
        newlen = 0;
    } else {
        if (end >= (signed)len) end = len-1;
        newlen = (start > end) ? 0 : (end-start)+1;
    }

    if (start && newlen) memmove(s, s+start, newlen);
    s[newlen] = 0;
    sdssetlen(s,newlen);
}

/* Apply tolower() to every character of the sds string 's'.
 *
 * Each byte is converted to unsigned char before the call: passing a
 * negative char value to tolower() is undefined behavior. The index is a
 * size_t so strings longer than INT_MAX bytes are handled too. */
void sdstolower(sds s) {
    size_t len = sdslen(s), j;

    for (j = 0; j < len; j++) s[j] = tolower((unsigned char)s[j]);
}

/* Apply toupper() to every character of the sds string 's'.
 *
 * Each byte is converted to unsigned char before the call: passing a
 * negative char value to toupper() is undefined behavior. The index is a
 * size_t so strings longer than INT_MAX bytes are handled too. */
void sdstoupper(sds s) {
    size_t len = sdslen(s), j;

    for (j = 0; j < len; j++) s[j] = toupper((unsigned char)s[j]);
}

/* Compare two sds strings s1 and s2 with memcmp().
 *
 * Return value:
 *
 *     positive if s1 > s2.
 *     negative if s1 < s2.
 *     0 if s1 and s2 are exactly the same binary string.
 *
 * If two strings share exactly the same prefix, but one of the two has
 * additional characters, the longer string is considered to be greater than
 * the smaller one. */
int sdscmp(const sds s1, const sds s2) {
    size_t l1, l2, minlen;
    int cmp;

    l1 = sdslen(s1);
    l2 = sdslen(s2);
    minlen = (l1 < l2) ? l1 : l2;
    cmp = memcmp(s1,s2,minlen);
    if (cmp != 0) return cmp;

    /* Decide on the lengths by comparing them: returning l1-l2 would
     * squeeze a size_t difference into an int, which can flip the sign or
     * even yield 0 for two strings of very different length. */
    if (l1 > l2) return 1;
    if (l1 < l2) return -1;
    return 0;
}

/* Split 's' with separator in 'sep'. An array
 * of sds strings is returned. *count will be set
 * by reference to the number of tokens returned.
 *
 * On out of memory, negative length or zero length
 * separator, NULL is returned and *count is set to 0.
 * A zero length string returns an allocated array
 * with *count set to 0.
 *
 * Note that 'sep' is able to split a string using
 * a multi-character separator. For example
 * sdssplit("foo_-_bar","_-_"); will return two
 * elements "foo" and "bar".
 *
 * This version of the function is binary-safe but
 * requires length arguments. sdssplit() is just the
 * same function but for zero-terminated strings.
 */
sds *sdssplitlen(const char *s, int len, const char *sep, int seplen, int *count) {
    int elements = 0, slots = 5, start = 0, j;
    sds *tokens;

    /* Give *count a defined value on every path, including the early
     * failures below, so callers never read an uninitialized counter. */
    *count = 0;

    if (seplen < 1 || len < 0) return NULL;

    tokens = s_malloc(sizeof(sds)*slots);
    if (tokens == NULL) return NULL;

    if (len == 0) {
        return tokens;
    }
    for (j = 0; j < (len-(seplen-1)); j++) {
        /* make sure there is room for the next element and the final one */
        if (slots < elements+2) {
            sds *newtokens;

            slots *= 2;
            newtokens = s_realloc(tokens,sizeof(sds)*slots);
            if (newtokens == NULL) goto cleanup;
            tokens = newtokens;
        }
        /* search the separator */
        if ((seplen == 1 && *(s+j) == sep[0]) || (memcmp(s+j,sep,seplen) == 0)) {
            tokens[elements] = sdsnewlen(s+start,j-start);
            if (tokens[elements] == NULL) goto cleanup;
            elements++;
            start = j+seplen;
            j = j+seplen-1; /* skip the separator */
        }
    }
    /* Add the final element. We are sure there is room in the tokens array. */
    tokens[elements] = sdsnewlen(s+start,len-start);
    if (tokens[elements] == NULL) goto cleanup;
    elements++;
    *count = elements;
    return tokens;

cleanup:
    {
        int i;
        for (i = 0; i < elements; i++) sdsfree(tokens[i]);
        s_free(tokens);
        *count = 0;
        return NULL;
    }
}

/* Release an array of 'count' sds strings as returned by sdssplitlen():
 * every element is freed, then the array itself. A NULL 'tokens' is
 * accepted and ignored. */
void sdsfreesplitres(sds *tokens, int count) {
    if (tokens == NULL) return;

    /* Free the elements from the last one down to the first. */
    while (count != 0) {
        count--;
        sdsfree(tokens[count]);
    }
    s_free(tokens);
}

/* Append to the sds string "s" an escaped string representation where
 * all the non-printable characters (tested with isprint()) are turned into
 * escapes in the form "\n\r\a...." or "\x<hex-number>". The representation
 * is wrapped in double quotes.
 *
 * After the call, the modified sds string is no longer valid and all the
 * references must be substituted with the new pointer returned by the call. */
sds sdscatrepr(sds s, const char *p, size_t len) {
    s = sdscatlen(s,"\"",1);
    while(len--) {
        switch(*p) {
        case '\\':
        case '"':
            s = sdscatprintf(s,"\\%c",*p);
            break;
        case '\n': s = sdscatlen(s,"\\n",2); break;
        case '\r': s = sdscatlen(s,"\\r",2); break;
        case '\t': s = sdscatlen(s,"\\t",2); break;
        case '\a': s = sdscatlen(s,"\\a",2); break;
        case '\b': s = sdscatlen(s,"\\b",2); break;
        default:
            /* Convert to unsigned char first: where char is signed, bytes
             * >= 0x80 are negative and passing them to isprint() is
             * undefined behavior. */
            if (isprint((unsigned char)*p))
                s = sdscatprintf(s,"%c",*p);
            else
                s = sdscatprintf(s,"\\x%02x",(unsigned char)*p);
            break;
        }
        p++;
    }
    return sdscatlen(s,"\"",1);
}

/* Helper for sdssplitargs(): return 1 when 'c' is a hexadecimal digit
 * (0-9, a-f or A-F) and 0 otherwise. */
int is_hex_digit(char c) {
    if (c >= '0' && c <= '9') return 1;
    if (c >= 'a' && c <= 'f') return 1;
    if (c >= 'A' && c <= 'F') return 1;
    return 0;
}

/* Helper for sdssplitargs(): map a hexadecimal digit to its value, an
 * integer from 0 to 15. Any character that is not a hex digit maps to 0. */
int hex_digit_to_int(char c) {
    if (c >= '0' && c <= '9') return c-'0';
    if (c >= 'a' && c <= 'f') return 10+(c-'a');
    if (c >= 'A' && c <= 'F') return 10+(c-'A');
    return 0;
}

/* Split a line into arguments, where every argument can be in the
 * following programming-language REPL-alike form:
 *
 * foo bar "newline are supported\n" and "\xff\x00otherstuff"
 *
 * The number of arguments is stored into *argc, and an array
 * of sds is returned.
 *
 * The caller should free the resulting array of sds strings with
 * sdsfreesplitres().
 *
 * Note that sdscatrepr() is able to convert back a string into
 * a quoted string in the same format sdssplitargs() is able to parse.
 *
 * The function returns the allocated tokens on success, even when the
 * input string is empty, or NULL if the input contains unbalanced
 * quotes or closed quotes followed by non space characters
 * as in: "foo"bar or "foo'
 *
 * NULL (with *argc set to 0) is also returned when the argument vector
 * cannot be enlarged.
 */
sds *sdssplitargs(const char *line, int *argc) {
    const char *p = line;
    char *current = NULL;
    char **vector = NULL;

    *argc = 0;
    while(1) {
        /* skip blanks (the cast keeps bytes >= 0x80 from reaching
         * isspace() as negative values, which is undefined behavior) */
        while(*p && isspace((unsigned char)*p)) p++;
        if (*p) {
            /* get a token */
            int inq=0;  /* set to 1 if we are in "quotes" */
            int insq=0; /* set to 1 if we are in 'single quotes' */
            int done=0;
            char **newvector;

            if (current == NULL) current = sdsempty();
            while(!done) {
                if (inq) {
                    if (*p == '\\' && *(p+1) == 'x' &&
                                             is_hex_digit(*(p+2)) &&
                                             is_hex_digit(*(p+3)))
                    {
                        unsigned char byte;

                        byte = (hex_digit_to_int(*(p+2))*16)+
                                hex_digit_to_int(*(p+3));
                        current = sdscatlen(current,(char*)&byte,1);
                        p += 3;
                    } else if (*p == '\\' && *(p+1)) {
                        char c;

                        p++;
                        switch(*p) {
                        case 'n': c = '\n'; break;
                        case 'r': c = '\r'; break;
                        case 't': c = '\t'; break;
                        case 'b': c = '\b'; break;
                        case 'a': c = '\a'; break;
                        default: c = *p; break;
                        }
                        current = sdscatlen(current,&c,1);
                    } else if (*p == '"') {
                        /* closing quote must be followed by a space or
                         * nothing at all. */
                        if (*(p+1) && !isspace((unsigned char)*(p+1))) goto err;
                        done=1;
                    } else if (!*p) {
                        /* unterminated quotes */
                        goto err;
                    } else {
                        current = sdscatlen(current,p,1);
                    }
                } else if (insq) {
                    if (*p == '\\' && *(p+1) == '\'') {
                        p++;
                        current = sdscatlen(current,"'",1);
                    } else if (*p == '\'') {
                        /* closing quote must be followed by a space or
                         * nothing at all. */
                        if (*(p+1) && !isspace((unsigned char)*(p+1))) goto err;
                        done=1;
                    } else if (!*p) {
                        /* unterminated quotes */
                        goto err;
                    } else {
                        current = sdscatlen(current,p,1);
                    }
                } else {
                    switch(*p) {
                    case ' ':
                    case '\n':
                    case '\r':
                    case '\t':
                    case '\0':
                        done=1;
                        break;
                    case '"':
                        inq=1;
                        break;
                    case '\'':
                        insq=1;
                        break;
                    default:
                        current = sdscatlen(current,p,1);
                        break;
                    }
                }
                if (*p) p++;
            }
            /* add the token to the vector; grow through a temporary so a
             * failed reallocation neither loses the old vector nor ends up
             * dereferencing NULL */
            newvector = s_realloc(vector,((*argc)+1)*sizeof(char*));
            if (newvector == NULL) goto err;
            vector = newvector;
            vector[*argc] = current;
            (*argc)++;
            current = NULL;
        } else {
            /* Even on empty input string return something not NULL. */
            if (vector == NULL) vector = s_malloc(sizeof(void*));
            return vector;
        }
    }

err:
    /* Release every token collected so far, the vector and the token that
     * was being built. */
    while((*argc)--)
        sdsfree(vector[*argc]);
    s_free(vector);
    if (current) sdsfree(current);
    *argc = 0;
    return NULL;
}

/* Replace, in place, every character of 's' found in the 'from' set with
 * the character at the same position of the 'to' array. Both arrays hold
 * 'setlen' entries, and the first matching entry of 'from' wins.
 *
 * For instance: sdsmapchars(mystring, "ho", "01", 2)
 * will have the effect of turning the string "hello" into "0ell1".
 *
 * The input pointer is returned unchanged, since no resize is needed. */
sds sdsmapchars(sds s, const char *from, const char *to, size_t setlen) {
    size_t total = sdslen(s);
    size_t pos;

    for (pos = 0; pos < total; pos++) {
        size_t k = 0;

        /* Look for the current character in the 'from' set. */
        while (k < setlen && s[pos] != from[k]) k++;
        if (k < setlen) s[pos] = to[k];
    }
    return s;
}

/* Concatenate the 'argc' C strings of 'argv' into a new sds string, placing
 * the C string 'sep' between consecutive elements. */
sds sdsjoin(char **argv, int argc, char *sep) {
    sds joined = sdsempty();
    int last = argc-1;
    int idx = 0;

    while (idx < argc) {
        joined = sdscat(joined, argv[idx]);
        /* No separator after the final element. */
        if (idx != last) joined = sdscat(joined,sep);
        idx++;
    }
    return joined;
}

/* Same as sdsjoin(), for an array of sds strings and a separator given as
 * a buffer of 'seplen' bytes. */
sds sdsjoinsds(sds *argv, int argc, const char *sep, size_t seplen) {
    sds joined = sdsempty();
    int last = argc-1;
    int idx = 0;

    while (idx < argc) {
        joined = sdscatsds(joined, argv[idx]);
        /* No separator after the final element. */
        if (idx != last) joined = sdscatlen(joined,sep,seplen);
        idx++;
    }
    return joined;
}

/* Return 1 if 's' is a non-empty sds string made only of the characters
 * '0'..'9', and 0 otherwise (including when 's' is NULL or empty). */
int sdsIsNum(sds s) {
    size_t pos, total;

    if (s == NULL) return 0;

    total = sdslen(s);
    if (total == 0) return 0;

    for (pos = 0; pos < total; pos++) {
        if (s[pos] < '0' || s[pos] > '9') return 0;
    }
    return 1;
}

/* Function wrappers around the allocator used by SDS. Inside this file the
 * s_malloc/s_realloc/s_free macros from sdsalloc.h are used directly, to
 * avoid paying the overhead of a function call. These wrappers exist for
 * the programs SDS is linked to, in case they want to touch the SDS
 * internals while using a different allocator themselves. */
void *sds_malloc(size_t size) {
    return s_malloc(size);
}

void *sds_realloc(void *ptr, size_t size) {
    return s_realloc(ptr,size);
}

void sds_free(void *ptr) {
    s_free(ptr);
}

#if defined(SDS_TEST_MAIN)
#include <stdio.h>
#include "testhelp.h"
#include "limits.h"

#define UNUSED(x) (void)(x)
/* Self-test for the SDS library (compiled only with SDS_TEST_MAIN).
 *
 * Runs a fixed sequence of checks through the test_cond() macro from
 * testhelp.h, prints the summary with test_report() and returns 0.
 * Each check reuses the strings 'x' and 'y', freeing them between cases. */
int sdsTest(void) {
    {
        sds x = sdsnew("foo"), y;

        test_cond("Create a string and obtain the length",
            sdslen(x) == 3 && memcmp(x,"foo\0",4) == 0)

        sdsfree(x);
        x = sdsnewlen("foo",2);
        test_cond("Create a string with specified length",
            sdslen(x) == 2 && memcmp(x,"fo\0",3) == 0)

        x = sdscat(x,"bar");
        test_cond("Strings concatenation",
            sdslen(x) == 5 && memcmp(x,"fobar\0",6) == 0);

        x = sdscpy(x,"a");
        test_cond("sdscpy() against an originally longer string",
            sdslen(x) == 1 && memcmp(x,"a\0",2) == 0)

        /* Compare 34 bytes so the terminating NUL is verified as well,
         * like the neighbouring checks do. */
        x = sdscpy(x,"xyzxxxxxxxxxxyyyyyyyyyykkkkkkkkkk");
        test_cond("sdscpy() against an originally shorter string",
            sdslen(x) == 33 &&
            memcmp(x,"xyzxxxxxxxxxxyyyyyyyyyykkkkkkkkkk\0",34) == 0)

        sdsfree(x);
        x = sdscatprintf(sdsempty(),"%d",123);
        test_cond("sdscatprintf() seems working in the base case",
            sdslen(x) == 3 && memcmp(x,"123\0",4) == 0)

        sdsfree(x);
        x = sdsnew("--");
        x = sdscatfmt(x, "Hello %s World %I,%I--", "Hi!", LLONG_MIN,LLONG_MAX);
        test_cond("sdscatfmt() seems working in the base case",
            sdslen(x) == 60 &&
            memcmp(x,"--Hello Hi! World -9223372036854775808,"
                     "9223372036854775807--",60) == 0)
        printf("[%s]\n",x);

        sdsfree(x);
        x = sdsnew("--");
        x = sdscatfmt(x, "%u,%U--", UINT_MAX, ULLONG_MAX);
        test_cond("sdscatfmt() seems working with unsigned numbers",
            sdslen(x) == 35 &&
            memcmp(x,"--4294967295,18446744073709551615--",35) == 0)

        sdsfree(x);
        x = sdsnew(" x ");
        sdstrim(x," x");
        test_cond("sdstrim() works when all chars match",
            sdslen(x) == 0)

        sdsfree(x);
        x = sdsnew(" x ");
        sdstrim(x," ");
        test_cond("sdstrim() works when a single char remains",
            sdslen(x) == 1 && x[0] == 'x')

        sdsfree(x);
        x = sdsnew("xxciaoyyy");
        sdstrim(x,"xy");
        test_cond("sdstrim() correctly trims characters",
            sdslen(x) == 4 && memcmp(x,"ciao\0",5) == 0)

        /* From here on 'x' holds "ciao" and 'y' is a scratch copy of it. */
        y = sdsdup(x);
        sdsrange(y,1,1);
        test_cond("sdsrange(...,1,1)",
            sdslen(y) == 1 && memcmp(y,"i\0",2) == 0)

        sdsfree(y);
        y = sdsdup(x);
        sdsrange(y,1,-1);
        test_cond("sdsrange(...,1,-1)",
            sdslen(y) == 3 && memcmp(y,"iao\0",4) == 0)

        sdsfree(y);
        y = sdsdup(x);
        sdsrange(y,-2,-1);
        test_cond("sdsrange(...,-2,-1)",
            sdslen(y) == 2 && memcmp(y,"ao\0",3) == 0)

        sdsfree(y);
        y = sdsdup(x);
        sdsrange(y,2,1);
        test_cond("sdsrange(...,2,1)",
            sdslen(y) == 0 && memcmp(y,"\0",1) == 0)

        sdsfree(y);
        y = sdsdup(x);
        sdsrange(y,1,100);
        test_cond("sdsrange(...,1,100)",
            sdslen(y) == 3 && memcmp(y,"iao\0",4) == 0)

        sdsfree(y);
        y = sdsdup(x);
        sdsrange(y,100,100);
        test_cond("sdsrange(...,100,100)",
            sdslen(y) == 0 && memcmp(y,"\0",1) == 0)

        sdsfree(y);
        sdsfree(x);
        x = sdsnew("foo");
        y = sdsnew("foa");
        test_cond("sdscmp(foo,foa)", sdscmp(x,y) > 0)

        sdsfree(y);
        sdsfree(x);
        x = sdsnew("bar");
        y = sdsnew("bar");
        test_cond("sdscmp(bar,bar)", sdscmp(x,y) == 0)

        sdsfree(y);
        sdsfree(x);
        x = sdsnew("aar");
        y = sdsnew("bar");
        /* Label names the strings actually compared, so a failure report
         * is distinguishable from the equal-strings case above. */
        test_cond("sdscmp(aar,bar)", sdscmp(x,y) < 0)

        sdsfree(y);
        sdsfree(x);
        x = sdsnewlen("\a\n\0foo\r",7);
        y = sdscatrepr(sdsempty(),x,sdslen(x));
        test_cond("sdscatrepr(...data...)",
            memcmp(y,"\"\\a\\n\\x00foo\\r\"",15) == 0)

        {
            char *p;
            int step = 10, j, i;

            sdsfree(x);
            sdsfree(y);
            x = sdsnew("0");
            test_cond("sdsnew() free/len buffers", sdslen(x) == 1 && sdsavail(x) == 0);

            /* Run the test a few times in order to hit the first two
             * SDS header types. */
            for (i = 0; i < 10; i++) {
                int oldlen = sdslen(x);
                x = sdsMakeRoomFor(x,step);
                int type = x[-1]&SDS_TYPE_MASK;

                test_cond("sdsMakeRoomFor() len", sdslen(x) == oldlen);
                /* Type 5 headers carry no allocation info, so the free
                 * space can only be checked for the other header types. */
                if (type != SDS_TYPE_5) {
                    test_cond("sdsMakeRoomFor() free", sdsavail(x) >= step);
                }
                /* Fill the newly reserved room and make it part of the
                 * string. */
                p = x+oldlen;
                for (j = 0; j < step; j++) {
                    p[j] = 'A'+j;
                }
                sdsIncrLen(x,step);
            }
            test_cond("sdsMakeRoomFor() content",
                memcmp("0ABCDEFGHIJABCDEFGHIJABCDEFGHIJABCDEFGHIJABCDEFGHIJABCDEFGHIJABCDEFGHIJABCDEFGHIJABCDEFGHIJABCDEFGHIJ",x,101) == 0);
            test_cond("sdsMakeRoomFor() final length",sdslen(x)==101);

            sdsfree(x);
        }
    }
    test_report()
    return 0;
}
#endif

#ifdef SDS_TEST_MAIN
/* Stand-alone test driver: the process exit status is whatever sdsTest()
 * returns. */
int main(void) {
    int status = sdsTest();

    return status;
}
#endif


================================================
FILE: dep/sds/sds.h
================================================
/* SDSLib 2.0 -- A C dynamic strings library
 *
 * Copyright (c) 2006-2015, Salvatore Sanfilippo <antirez at gmail dot com>
 * Copyright (c) 2015, Oran Agra
 * Copyright (c) 2015, Redis Labs, Inc
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *   * Redistributions of source code must retain the above copyright notice,
 *     this list of conditions and the following disclaimer.
 *   * Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *   * Neither the name of Redis nor the names of its contributors may be used
 *     to endorse or promote products derived from this software without
 *     specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

#ifndef __SDS_H
#define __SDS_H

#define SDS_MAX_PREALLOC (1024*1024)

#include <sys/types.h>
#include <stdarg.h>
#include <stdint.h>

typedef char *sds;

/* SDS header layouts.
 *
 * An sds value points at buf[], so the header sits immediately before the
 * pointer handed to the user. All headers are packed (no padding), which
 * makes 'flags' the byte right before buf[] in every variant: that is why
 * the accessors below can read the type from s[-1] without knowing the
 * header size first.
 *
 * Note: sdshdr5 is never used, we just access the flags byte directly.
 * However is here to document the layout of type 5 SDS strings. */
struct __attribute__ ((__packed__)) sdshdr5 {
    unsigned char flags; /* 3 lsb of type, and 5 msb of string length */
    char buf[];
};
/* Header with 8 bit length/allocation counters. */
struct __attribute__ ((__packed__)) sdshdr8 {
    uint8_t len; /* used */
    uint8_t alloc; /* excluding the header and null terminator */
    unsigned char flags; /* 3 lsb of type, 5 unused bits */
    char buf[];
};
/* Header with 16 bit length/allocation counters. */
struct __attribute__ ((__packed__)) sdshdr16 {
    uint16_t len; /* used */
    uint16_t alloc; /* excluding the header and null terminator */
    unsigned char flags; /* 3 lsb of type, 5 unused bits */
    char buf[];
};
/* Header with 32 bit length/allocation counters. */
struct __attribute__ ((__packed__)) sdshdr32 {
    uint32_t len; /* used */
    uint32_t alloc; /* excluding the header and null terminator */
    unsigned char flags; /* 3 lsb of type, 5 unused bits */
    char buf[];
};
/* Header with 64 bit length/allocation counters. */
struct __attribute__ ((__packed__)) sdshdr64 {
    uint64_t len; /* used */
    uint64_t alloc; /* excluding the header and null terminator */
    unsigned char flags; /* 3 lsb of type, 5 unused bits */
    char buf[];
};

/* Header type codes stored in the low SDS_TYPE_BITS bits of the flags
 * byte; SDS_TYPE_MASK extracts them. */
#define SDS_TYPE_5  0
#define SDS_TYPE_8  1
#define SDS_TYPE_16 2
#define SDS_TYPE_32 3
#define SDS_TYPE_64 4
#define SDS_TYPE_MASK 7
#define SDS_TYPE_BITS 3
/* SDS_HDR_VAR(T,s): declare a local variable 'sh' pointing to the sdshdrT
 * header that precedes the string 's'. The expansion already ends with a
 * semicolon and introduces the name 'sh' into the current scope. */
#define SDS_HDR_VAR(T,s) struct sdshdr##T *sh = (void*)((s)-(sizeof(struct sdshdr##T)));
/* SDS_HDR(T,s): expression form, yields a pointer to the sdshdrT header
 * of 's' without declaring anything. */
#define SDS_HDR(T,s) ((struct sdshdr##T *)((s)-(sizeof(struct sdshdr##T))))
/* Length of a type 5 string: the bits of the flags byte above the type. */
#define SDS_TYPE_5_LEN(f) ((f)>>SDS_TYPE_BITS)

/* Return the number of bytes currently used by the string 's'.
 * The header type is decoded from the flags byte stored at s[-1];
 * an unknown type code yields 0. */
static inline size_t sdslen(const sds s) {
    const unsigned char hdr = s[-1];
    const int kind = hdr & SDS_TYPE_MASK;

    if (kind == SDS_TYPE_5) return SDS_TYPE_5_LEN(hdr);
    if (kind == SDS_TYPE_8) return SDS_HDR(8,s)->len;
    if (kind == SDS_TYPE_16) return SDS_HDR(16,s)->len;
    if (kind == SDS_TYPE_32) return SDS_HDR(32,s)->len;
    if (kind == SDS_TYPE_64) return SDS_HDR(64,s)->len;
    return 0;
}

static inline size_t sdsavail(const sds s) {
    unsigned char flags = s[-1];
    switch(flags&SDS_TYPE_MASK) {
        case SDS_TYPE_5: {
            return 0;
        }
        case SDS_TYPE_8: {
            SDS_HDR_VAR(8,s);
            return sh->alloc - sh->len;
        }
        case SDS_TYPE_16: {
            SDS_HDR_VAR(16,s);
            return sh->alloc - sh->len;
        }
        case SDS_TYPE_32: {
            SDS_HDR_VAR(32,s);
            return sh->alloc - sh->len;
        }
        case SDS_TYPE_64: {
            SDS_HDR_VAR(64,s);
            return sh->alloc - sh->len;
        }
    }
    return 0;
}

/* Store 'newlen' as the used length of 's'. Only the header is updated:
 * the buffer content and the allocation are left alone. For type 5
 * strings the length lives in the upper bits of the flags byte itself. */
static inline void sdssetlen(sds s, size_t newlen) {
    const unsigned char hdr = s[-1];
    const int kind = hdr & SDS_TYPE_MASK;

    if (kind == SDS_TYPE_5) {
        unsigned char *flagp = ((unsigned char*)s)-1;
        *flagp = SDS_TYPE_5 | (newlen << SDS_TYPE_BITS);
    } else if (kind == SDS_TYPE_8) {
        SDS_HDR(8,s)->len = newlen;
    } else if (kind == SDS_TYPE_16) {
        SDS_HDR(16,s)->len = newlen;
    } else if (kind == SDS_TYPE_32) {
        SDS_HDR(32,s)->len = newlen;
    } else if (kind == SDS_TYPE_64) {
        SDS_HDR(64,s)->len = newlen;
    }
}

/* Add 'inc' to the used length recorded in the header of 's'. No bounds
 * check against the allocation is performed here. */
static inline void sdsinclen(sds s, size_t inc) {
    const unsigned char hdr = s[-1];
    const int kind = hdr & SDS_TYPE_MASK;

    if (kind == SDS_TYPE_5) {
        /* Length and type share the flags byte: rebuild it from the
         * incremented length. */
        unsigned char *flagp = ((unsigned char*)s)-1;
        unsigned char grown = SDS_TYPE_5_LEN(hdr)+inc;
        *flagp = SDS_TYPE_5 | (grown << SDS_TYPE_BITS);
    } else if (kind == SDS_TYPE_8) {
        SDS_HDR(8,s)->len += inc;
    } else if (kind == SDS_TYPE_16) {
        SDS_HDR(16,s)->len += inc;
    } else if (kind == SDS_TYPE_32) {
        SDS_HDR(32,s)->len += inc;
    } else if (kind == SDS_TYPE_64) {
        SDS_HDR(64,s)->len += inc;
    }
}

/* Return the allocated capacity of 's' (header and terminator excluded),
 * so that sdsalloc() == sdsavail() + sdslen(). Type 5 strings have no
 * separate capacity field: their length is reported instead. */
static inline size_t sdsalloc(const sds s) {
    const unsigned char hdr = s[-1];
    const int kind = hdr & SDS_TYPE_MASK;

    if (kind == SDS_TYPE_5) return SDS_TYPE_5_LEN(hdr);
    if (kind == SDS_TYPE_8) return SDS_HDR(8,s)->alloc;
    if (kind == SDS_TYPE_16) return SDS_HDR(16,s)->alloc;
    if (kind == SDS_TYPE_32) return SDS_HDR(32,s)->alloc;
    if (kind == SDS_TYPE_64) return SDS_HDR(64,s)->alloc;
    return 0;
}

/* Record 'newlen' as the allocated capacity in the header of 's'.
 * Type 5 strings have no capacity field, so the call is a no-op for
 * them (and for unknown type codes). */
static inline void sdssetalloc(sds s, size_t newlen) {
    const unsigned char hdr = s[-1];
    const int kind = hdr & SDS_TYPE_MASK;

    if (kind == SDS_TYPE_8) {
        SDS_HDR(8,s)->alloc = newlen;
    } else if (kind == SDS_TYPE_16) {
        SDS_HDR(16,s)->alloc = newlen;
    } else if (kind == SDS_TYPE_32) {
        SDS_HDR(32,s)->alloc = newlen;
    } else if (kind == SDS_TYPE_64) {
        SDS_HDR(64,s)->alloc = newlen;
    }
}

/* SDS API implemented in sds.c. */
sds sdsnewlen(const void *init, size_t initlen);
sds sdsnew(const char *init);
sds sdsempty(void);
sds sdsdup(const sds s);
void sdsfree(sds s);
sds sdsgrowzero(sds s, size_t len);
sds sdscatlen(sds s, const void *t, size_t len);
sds sdscat(sds s, const char *t);
sds sdscatsds(sds s, const sds t);
sds sdscpylen(sds s, const char *t, size_t len);
sds sdscpy(sds s, const char *t);

sds sdscatvprintf(sds s, const char *fmt, va_list ap);
/* With GCC-compatible compilers sdscatprintf() is tagged as printf-like
 * (format string is argument 2, variadic arguments start at 3) so the
 * compiler can check the arguments against 'fmt'. */
#ifdef __GNUC__
sds sdscatprintf(sds s, const char *fmt, ...)
    __attribute__((format(printf, 2, 3)));
#else
sds sdscatprintf(sds s, const char *fmt, ...);
#endif

sds sdscatfmt(sds s, char const *fmt, ...);
sds sdstrim(sds s, const char *cset);
void sdsrange(sds s, int start, int end);
void sdsupdatelen(sds s);
void sdsclear(sds s);
int sdscmp(const sds s1, const sds s2);
sds *sdssplitlen(const char *s, int len, const char *sep, int seplen, int *count);
void sdsfreesplitres(sds *tokens, int count);
void sdstolower(sds s);
void sdstoupper(sds s);
sds sdsfromlonglong(long long value);
sds sdscatrepr(sds s, const char *p, size_t len);
sds *sdssplitargs(const char *line, int *argc);
/* Replace in place every byte of 's' equal to from[i] with to[i]
 * (i < setlen); returns 's' itself. */
sds sdsmapchars(sds s, const char *from, const char *to, size_t setlen);
/* Join 'argc' C strings with the C string 'sep' into a new sds string. */
sds sdsjoin(char **argv, int argc, char *sep);
/* Join 'argc' sds strings with the 'seplen' bytes at 'sep' into a new
 * sds string. */
sds sdsjoinsds(sds *argv, int argc, const char *sep, size_t seplen);

/* Returns 1 when 's' is non-NULL, non-empty and contains only the
 * characters '0'..'9'; 0 otherwise. */
int sdsIsNum(sds s);

/* Low level functions exposed to the user API */
sds sdsMakeRoomFor(sds s, size_t addlen);
void sdsIncrLen(sds s, int incr);
sds sdsRemoveFreeSpace(sds s);
size_t sdsAllocSize(sds s);
void *sdsAllocPtr(sds s);

/* Export the allocator used by SDS to the program using SDS.
 * Sometimes the program SDS is linked to, may use a different set of
 * allocators, but may want to allocate or free things that SDS will
 * respectively free or allocate. */
void *sds_malloc(size_t size);
void *sds_realloc(void *ptr, size_t size);
void sds_free(void *ptr);

/* Self-test entry point. The only definition (in sds.c) is
 * `int sdsTest(void)` and is compiled when SDS_TEST_MAIN is defined, so the
 * declaration uses that exact signature and is visible under the same
 * macro; REDIS_TEST is kept so existing builds that define it still see a
 * declaration. */
#if defined(REDIS_TEST) || defined(SDS_TEST_MAIN)
int sdsTest(void);
#endif

#endif


================================================
FILE: dep/sds/sdsalloc.h
================================================
/* SDSLib 2.0 -- A C dynamic strings library
 *
 * Copyright (c) 2006-2015, Salvatore Sanfilippo <antirez at gmail dot com>
 * Copyright (c) 2015, Redis Labs, Inc
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *   * Redistributions of source code must retain the above copyright notice,
 *     this list of conditions and the following disclaimer.
 *   * Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *   * Neither the name of Redis nor the names of its contributors may be used
 *     to endorse or promote products derived from this software without
 *     specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

/* SDS allocator selection.
 *
 * This file is used in order to change the SDS allocator at compile time.
 * Just define the following defines to what you want to use. Also add
 * the include of your alternate allocator if needed (not needed in order
 * to use the default libc allocator). */

#include <dmalloc.h>

/* Allocator entry points used by SDS. They are mapped to dalloc, drealloc
 * and dfree (presumably declared by the <dmalloc.h> included above --
 * confirm), not to the libc allocator. */
#define s_malloc    dalloc
#define s_realloc   drealloc
#define s_free      dfree


================================================
FILE: dep/util/Makefile.am
================================================
# Also remove the generated Makefile.in on `make maintainer-clean`.
MAINTAINERCLEANFILES = Makefile.in

# Warning flags applied to every object built in this directory.
AM_CFLAGS = -Wall -Wshadow
AM_CFLAGS += -Wno-unused-parameter -Wno-unused-value

# Static utility library; the noinst_ prefix means it is built but never
# installed.
noinst_LIBRARIES = libdutil.a

# Headers shipped with the sources but not installed.
noinst_HEADERS = dspecialconfig.h dutil.h dlog.h

# Files that make up libdutil.a.
libdutil_a_SOURCES =    \
    dspecialconfig.h    \
	dutil.c dutil.h     \
    dlog.c dlog.h

================================================
FILE: dep/util/dlog.c
================================================
#include <stdlib.h>
#include <stdarg.h>
#include <unistd.h>
#include <ctype.h>
#include <time.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <errno.h>

#include <dutil.h>
#include <dlog.h>

/* The single logger instance shared by every log_* function in this file. */
static struct logger logger;

/*
 * Initialise the global logger.
 *
 * 'level' is clamped into [LOG_EMERG, LOG_PVERB]. 'name' is the log file
 * path; the pointer itself is stored (not copied). A NULL or empty name
 * selects stderr, otherwise the file is opened for appending and created
 * with mode 0644 if needed.
 *
 * Returns 0 on success, -1 if the log file could not be opened (the
 * reason is reported on stderr).
 */
int
log_init(int level, char *name)
{
    struct logger *l = &logger;

    l->level = MAX(LOG_EMERG, MIN(level, LOG_PVERB));
    l->name = name;

    if (name == NULL || !strlen(name)) {
        l->fd = STDERR_FILENO;
        return 0;
    }

    l->fd = open(name, O_WRONLY | O_APPEND | O_CREAT, 0644);
    if (l->fd >= 0) {
        return 0;
    }

    log_stderr("opening log file '%s' failed: %s", name,
               strerror(errno));
    return -1;
}

/*
 * Shut the logger down: close the log file unless logging goes to stderr
 * or no valid descriptor is held.
 *
 * After closing, the stored descriptor is invalidated. Every writer in
 * this file bails out when fd < 0, so later log calls become no-ops
 * instead of writing to a closed (and possibly reused) descriptor, and a
 * second log_deinit() does not close the same number twice.
 */
void
log_deinit(void)
{
    struct logger *l = &logger;

    if (l->fd < 0 || l->fd == STDERR_FILENO) {
        return;
    }

    close(l->fd);
    l->fd = -1;
}

/*
 * Close and re-open the log file by name (e.g. after the file has been
 * rotated away). Nothing is done when logging goes to stderr. If the
 * re-open fails the failure is reported on stderr and otherwise ignored;
 * the stored descriptor is then negative.
 */
void
log_reopen(void)
{
    struct logger *l = &logger;

    if (l->fd == STDERR_FILENO) {
        return;
    }

    close(l->fd);
    l->fd = open(l->name, O_WRONLY | O_APPEND | O_CREAT, 0644);
    if (l->fd >= 0) {
        return;
    }

    log_stderr_safe("reopening log file '%s' failed, ignored: %s", l->name,
               strerror(errno));
}

/*
 * Raise the verbosity by one step, up to LOG_PVERB, and report the new
 * level through log_safe(). At the maximum level nothing happens.
 */
void
log_level_up(void)
{
    struct logger *l = &logger;

    if (l->level >= LOG_PVERB) {
        return;
    }

    l->level++;
    log_safe("up log level to %d", l->level);
}

/*
 * Lower the verbosity by one step, down to LOG_EMERG, and report the new
 * level through log_safe(). At the minimum level nothing happens.
 */
void
log_level_down(void)
{
    struct logger *l = &logger;

    if (l->level <= LOG_EMERG) {
        return;
    }

    l->level--;
    log_safe("down log level to %d", l->level);
}

/*
 * Set the verbosity to 'level', clamped into [LOG_EMERG, LOG_PVERB], and
 * log the resulting value unconditionally.
 */
void
log_level_set(int level)
{
    struct logger *l = &logger;
    int clamped = MAX(LOG_EMERG, MIN(level, LOG_PVERB));

    l->level = clamped;
    loga("set log level to %d", l->level);
}

/*
 * Dump the current stack trace straight to the log descriptor via
 * dstacktrace_fd(); does nothing when no valid descriptor is held.
 */
void
log_stacktrace(void)
{
    struct logger *l = &logger;

    if (l->fd >= 0) {
        dstacktrace_fd(l->fd);
    }
}

/*
 * Return 1 if a message of severity 'level' passes the configured
 * verbosity (level <= current level), 0 otherwise.
 */
int
log_loggable(int level)
{
    struct logger *l = &logger;

    return (level <= l->level) ? 1 : 0;
}

/*
 * Format one log line and write it to the log descriptor.
 *
 * The line has the form "[YYYY-mm-dd HH:MM:SS.mmm] file:line message\n"
 * and is truncated to LOG_MAX_LEN bytes. 'level' is not examined here:
 * filtering is done by the calling macros through log_loggable(). When
 * 'panic' is non-zero the process is aborted after the line is written.
 *
 * errno is preserved across the call. A failed write only bumps the
 * logger's error counter.
 */
void
_log(const char *file, int line, int level, int panic, const char *fmt, ...)
{
    struct logger *l = &logger;
    int len, size, errno_save;
    char buf[LOG_MAX_LEN];
    va_list args;
    ssize_t n;
    struct timeval tv;
    struct tm tm_buf;

    if (l->fd < 0) {
        return;
    }

    errno_save = errno;
    len = 0;            /* length of output buffer */
    size = LOG_MAX_LEN; /* size of output buffer */

    gettimeofday(&tv, NULL);
    buf[len++] = '[';
    /*
     * localtime_r() writes into a caller-owned struct tm, so concurrent
     * loggers do not race on the static buffer used by localtime(). If the
     * conversion fails, the date part is simply left out.
     */
    if (localtime_r(&tv.tv_sec, &tm_buf) != NULL) {
        len += dstrftime(buf + len, size - len, "%Y-%m-%d %H:%M:%S.", &tm_buf);
    }
    /* tv_usec is a suseconds_t, which is not 'long' everywhere: cast it to
     * match the %ld conversion. */
    len += dscnprintf(buf + len, size - len, "%03ld", (long)(tv.tv_usec / 1000));
    len += dscnprintf(buf + len, size - len, "] %s:%d ", file, line);

    va_start(args, fmt);
    len += dvscnprintf(buf + len, size - len, fmt, args);
    va_end(args);

    /* The formatters above never use the last byte of buf, so there is
     * always room for the newline. */
    buf[len++] = '\n';

    n = write(l->fd, buf, len);
    if (n < 0) {
        l->nerror++;
    }

    errno = errno_save;

    if (panic) {
        abort();
    }
}

/*
 * Format a message, append a newline and write it to standard error,
 * regardless of the configured log file or level. The message is
 * truncated to fit a buffer of 4 * LOG_MAX_LEN bytes. errno is preserved;
 * a failed write only increments the logger's error counter.
 */
void
_log_stderr(const char *fmt, ...)
{
    struct logger *lg = &logger;
    char out[4 * LOG_MAX_LEN];
    int cap = 4 * LOG_MAX_LEN;  /* capacity of out[] */
    int saved_errno = errno;
    int used;                   /* bytes of out[] in use */
    va_list ap;

    va_start(ap, fmt);
    used = dvscnprintf(out, cap, fmt, ap);
    va_end(ap);

    out[used] = '\n';
    used++;

    if (write(STDERR_FILENO, out, used) < 0) {
        lg->nerror++;
    }

    errno = saved_errno;
}

/*
 * Format a message, append a newline and write it to standard output,
 * regardless of the configured log file or level. The message is
 * truncated to fit a buffer of 4 * LOG_MAX_LEN bytes. errno is preserved;
 * a failed write only increments the logger's error counter.
 */
void
_log_stdout(const char *fmt, ...)
{
    struct logger *lg = &logger;
    char out[4 * LOG_MAX_LEN];
    int cap = 4 * LOG_MAX_LEN;  /* capacity of out[] */
    int saved_errno = errno;
    int used;                   /* bytes of out[] in use */
    va_list ap;

    va_start(ap, fmt);
    used = dvscnprintf(out, cap, fmt, ap);
    va_end(ap);

    out[used] = '\n';
    used++;

    if (write(STDOUT_FILENO, out, used) < 0) {
        lg->nerror++;
    }

    errno = saved_errno;
}

/*
 * Hexadecimal dump in the canonical hex + ascii display
 * See -C option in man hexdump
 *
 * Writes up to 'datalen' bytes of 'data' to the log descriptor, 16 bytes
 * per row: an 8 digit hex offset, the bytes in hex (with an extra gap
 * after the eighth), then the same bytes as text between '|' with
 * non-printable bytes shown as '.'. Output is limited to a buffer of
 * 8 * LOG_MAX_LEN bytes; when that limit is reached the dump is cut short
 * and a newline is written after it.
 *
 * 'file', 'line' and 'fmt' (with its arguments) are accepted for symmetry
 * with _log() but are not used here. A 'datalen' <= 0 dumps nothing.
 * errno is preserved across the call.
 */
void
_log_hexdump(const char *file, int line, char *data, int datalen,
             const char *fmt, ...)
{
    struct logger *l = &logger;
    char buf[8 * LOG_MAX_LEN];
    int i, off, len, size, errno_save;
    ssize_t n;

    if (l->fd < 0) {
        return;
    }

    /* log hexdump */
    errno_save = errno;
    off = 0;                  /* data offset */
    len = 0;                  /* length of output buffer */
    size = 8 * LOG_MAX_LEN;   /* size of output buffer */

    /* 'datalen > 0' rather than '!= 0': a negative length must not make
     * the loops walk past the end of 'data'. */
    while (datalen > 0 && (len < size - 1)) {
        char *save, *str;
        unsigned char c;
        int savelen;

        len += dscnprintf(buf + len, size - len, "%08x  ", off);

        /* The row is walked twice (hex, then text): remember its start. */
        save = data;
        savelen = datalen;

        for (i = 0; datalen > 0 && i < 16; data++, datalen--, i++) {
            c = (unsigned char)(*data);
            str = (i == 7) ? "  " : " ";
            len += dscnprintf(buf + len, size - len, "%02x%s", c, str);
        }
        /* Pad a short final row so the text column stays aligned. */
        for ( ; i < 16; i++) {
            str = (i == 7) ? "  " : " ";
            len += dscnprintf(buf + len, size - len, "  %s", str);
        }

        data = save;
        datalen = savelen;

        len += dscnprintf(buf + len, size - len, "  |");

        for (i = 0; datalen > 0 && i < 16; data++, datalen--, i++) {
            /* isprint() is only defined for unsigned char values and EOF;
             * convert first so bytes >= 0x80 are not passed as negative. */
            c = (unsigned char)(*data);
            if (!isprint(c)) {
                c = '.';
            }
            len += dscnprintf(buf + len, size - len, "%c", c);
        }
        len += dscnprintf(buf + len, size - len, "|\n");

        off += 16;
    }

    n = write(l->fd, buf, len);
    if (n < 0) {
        l->nerror++;
    }

    /* Buffer filled up: the last row may lack its newline, add one. */
    if (len >= size - 1) {
        n = write(l->fd, "\n", 1);
        if (n < 0) {
            l->nerror++;
        }
    }

    errno = errno_save;
}

/*
 * Write a log line to the log descriptor using only the dsafe_* formatters.
 * No timestamp is computed: a fixed placeholder of dots takes its place.
 * Does nothing when no valid descriptor is held. The line is truncated to
 * LOG_MAX_LEN bytes, errno is preserved, and a failed write only
 * increments the logger's error counter.
 */
void
_log_safe(const char *fmt, ...)
{
    struct logger *lg = &logger;
    char out[LOG_MAX_LEN];
    int cap = LOG_MAX_LEN;  /* capacity of out[] */
    int used = 0;           /* bytes of out[] in use */
    int saved_errno;
    va_list ap;

    if (lg->fd < 0) {
        return;
    }

    saved_errno = errno;

    used += dsafe_snprintf(out + used, cap - used, "[.......................] ");

    va_start(ap, fmt);
    used += dsafe_vsnprintf(out + used, cap - used, fmt, ap);
    va_end(ap);

    out[used] = '\n';
    used++;

    if (write(lg->fd, out, used) < 0) {
        lg->nerror++;
    }

    errno = saved_errno;
}

/*
 * Same as _log_safe(), but the line always goes to standard error and is
 * written even when no log descriptor is held.
 */
void
_log_stderr_safe(const char *fmt, ...)
{
    struct logger *lg = &logger;
    char out[LOG_MAX_LEN];
    int cap = LOG_MAX_LEN;  /* capacity of out[] */
    int used = 0;           /* bytes of out[] in use */
    int saved_errno = errno;
    va_list ap;

    used += dsafe_snprintf(out + used, cap - used, "[.......................] ");

    va_start(ap, fmt);
    used += dsafe_vsnprintf(out + used, cap - used, fmt, ap);
    va_end(ap);

    out[used] = '\n';
    used++;

    if (write(STDERR_FILENO, out, used) < 0) {
        lg->nerror++;
    }

    errno = saved_errno;
}

/*
 * Write 'len' raw bytes from 'str' to the log descriptor, with no prefix,
 * formatting or newline added. Does nothing when no valid descriptor is
 * held. errno is preserved; a failed write only increments the logger's
 * error counter.
 */
void log_write_len(char *str, size_t len)
{
    struct logger *lg = &logger;
    int saved_errno;

    if (lg->fd < 0) {
        return;
    }

    saved_errno = errno;
    if (write(lg->fd, str, len) < 0) {
        lg->nerror++;
    }
    errno = saved_errno;
}


================================================
FILE: dep/util/dlog.h
================================================
#ifndef _DLOG_H_
#define _DLOG_H_

#ifdef HAVE_CONFIG_H
# include <config.h>
#endif

/* State of the process-wide logger (a single instance lives in dlog.c). */
struct logger {
    char *name;  /* log file name; pointer as passed to log_init(), not a copy */
    int  level;  /* log level; messages with a higher level are filtered out */
    int  fd;     /* log file descriptor; negative disables file logging */
    int  nerror; /* # log error, incremented whenever a write() fails */
};

/* Log levels, from least (0) to most (11) verbose. log_init() and
 * log_level_set() clamp the configured level into [LOG_EMERG, LOG_PVERB]. */
#define LOG_EMERG   0   /* system is unusable */
#define LOG_ALERT   1   /* action must be taken immediately */
#define LOG_CRIT    2   /* critical conditions */
#define LOG_ERR     3   /* error conditions */
#define LOG_WARN    4   /* warning conditions */
#define LOG_NOTICE  5   /* normal but significant condition (default) */
#define LOG_INFO    6   /* informational */
#define LOG_DEBUG   7   /* debug messages */
#define LOG_VERB    8   /* verbose messages */
#define LOG_VVERB   9   /* verbose messages on crack */
#define LOG_VVVERB  10  /* verbose messages on ganga */
#define LOG_PVERB   11  /* periodic verbose messages on crack */

/* Buffer size used for one formatted log line, prefix and newline included. */
#define LOG_MAX_LEN 256 /* max length of log message */

/*
 * log_stderr   - log to stderr
 * loga         - log always
 * loga_hexdump - log hexdump always
 * log_error    - error log messages
 * log_warn     - warning log messages
 * log_panic    - log messages followed by a panic
 * ...
 * log_debug    - debug log messages based on a log level
 * log_hexdump  - hexdump -C of a log buffer
 */
/*
 * log_debug(level, fmt, ...): log a message if 'level' passes the current
 * log level. Only active when HAVE_DEBUG_LOG is defined; otherwise the
 * macro expands to nothing and its arguments are not evaluated.
 */
#ifdef HAVE_DEBUG_LOG

#define log_debug(_level, ...) do {                                         \
    if (log_loggable(_level) != 0) {                                        \
        _log(__FILE__, __LINE__, _level, 0, __VA_ARGS__);                   \
    }                                                                       \
} while (0)

#else

#define log_debug(_level, ...)

#endif

/*
 * log_hexdump(level, data, datalen, fmt, ...): if 'level' passes the
 * current log level, log the formatted message and then a hex dump of
 * 'datalen' bytes starting at 'data'.
 */
#define log_hexdump(_level, _data, _datalen, ...) do {                      \
    if (log_loggable(_level) != 0) {                                        \
        _log(__FILE__, __LINE__, _level, 0, __VA_ARGS__);                   \
        _log_hexdump(__FILE__, __LINE__, (char *)(_data), (int)(_datalen),  \
                     __VA_ARGS__);                                          \
    }                                                                       \
} while (0)

/* log_stderr(fmt, ...): print the message to standard error, unfiltered. */
#define log_stderr(...) do {                                                \
    _log_stderr(__VA_ARGS__);                                               \
} while (0)

/* log_stdout(fmt, ...): print the message to standard output, unfiltered. */
#define log_stdout(...) do {                                                \
    _log_stdout(__VA_ARGS__);                                               \
} while (0)

/* log_safe(fmt, ...): log to the log file through _log_safe(), which
 * formats with the dsafe_* helpers and prints no timestamp. */
#define log_safe(...) do {                                                  \
    _log_safe(__VA_ARGS__);                                                 \
} while (0)

/* log_stderr_safe(fmt, ...): like log_safe(), but written to standard
 * error. */
#define log_stderr_safe(...) do {                                           \
    _log_stderr_safe(__VA_ARGS__);                                          \
} while (0)

/* loga(fmt, ...): log always, i.e. without consulting log_loggable(). */
#define loga(...) do {                                                      \
    _log(__FILE__, __LINE__, LOG_EMERG, 0, __VA_ARGS__);                    \
} while (0)

/*
 * loga_hexdump(data, datalen, fmt, ...): log the formatted message and a
 * hex dump of 'datalen' bytes at 'data', without consulting the log level.
 *
 * The final line deliberately carries no continuation backslash, so the
 * macro ends at "while (0)" no matter what follows it in the file.
 */
#define loga_hexdump(_data, _datalen, ...) do {                             \
    _log(__FILE__, __LINE__, LOG_EMERG, 0, __VA_ARGS__);                    \
    _log_hexdump(__FILE__, __LINE__, (char *)(_data), (int)(_datalen),      \
                 __VA_ARGS__);                                              \
} while (0)

/* log_error(fmt, ...): log when the current level admits LOG_ERR. */
#define log_error(...) do {                                                 \
    if (log_loggable(LOG_ERR) != 0) {                                       \
        _log(__FILE__, __LINE__, LOG_ERR, 0, __VA_ARGS__);                  \
    }                                                                       \
} while (0)

/* log_warn(fmt, ...): log when the current level admits LOG_WARN. */
#define log_warn(...) do {                                                  \
    if (log_loggable(LOG_WARN) != 0) {                                      \
        _log(__FILE__, __LINE__, LOG_WARN, 0, __VA_ARGS__);                 \
    }                                                                       \
} while (0)

/* log_notice(fmt, ...): log when the current level admits LOG_NOTICE. */
#define log_notice(...) do {                                                \
    if (log_loggable(LOG_NOTICE) != 0) {                                    \
        _log(__FILE__, __LINE__, LOG_NOTICE, 0, __VA_ARGS__);               \
    }                                                                       \
} while (0)

/* log_panic(fmt, ...): log the message with the panic flag set, which
 * makes _log() call abort() once the line has been written. */
#define log_panic(...) do {                                                 \
    if (log_loggable(LOG_EMERG) != 0) {                                     \
        _log(__FILE__, __LINE__, LOG_EMERG, 1, __VA_ARGS__);                \
    }                                                                       \
} while (0)

/* Logger life cycle and level control. log_init() returns 0 on success and
 * -1 when the log file cannot be opened; a NULL or empty filename selects
 * stderr. */
int log_init(int level, char *filename);
void log_deinit(void);
void log_level_up(void);
void log_level_down(void);
void log_level_set(int level);
void log_stacktrace(void);
void log_reopen(void);
/* Returns 1 if 'level' is at or below the configured level, else 0. */
int log_loggable(int level);

/* Back ends of the logging macros above; normally used through the macros
 * rather than called directly. */
void _log(const char *file, int line, int level, int panic, const char *fmt, ...);
void _log_stderr(const char *fmt, ...);
void _log_stdout(const char *fmt, ...);
void _log_safe(const char *fmt, ...);
void _log_stderr_safe(const char *fmt, ...);
void _log_hexdump(const char *file, int line, char *data, int datalen, const char *fmt, ...);

/* Write 'len' raw bytes of 'str' to the log file, with nothing added. */
void log_write_len(char * str, size_t len);

#endif


================================================
FILE: dep/util/dspecialconfig.h
================================================
#ifndef _DSPECIALCONFIG_H_
#define _DSPECIALCONFIG_H_

#ifdef __APPLE__
#include <AvailabilityMacros.h>
#endif

#ifdef __linux__
#include <linux/version.h>
#include <features.h>
#endif

/*
 * Define HAVE_ATOMIC on i386/amd64/powerpc with a GNU-compatible compiler
 * when either the compiler is clang, or glibc provides __GLIBC_PREREQ and
 * the toolchain is at least GCC 4.1 with glibc 2.6.
 * GNUC_VERSION encodes the GCC version as major*10000 + minor*100 + patch.
 * NOTE(review): HAVE_ATOMIC presumably selects compiler atomic builtins
 * elsewhere in the tree -- confirm against the users of this macro.
 */
#if (__i386 || __amd64 || __powerpc__) && __GNUC__
#define GNUC_VERSION (__GNUC__ * 10000 + __GNUC_MINOR__ * 100 + __GNUC_PATCHLEVEL__)
#if defined(__clang__)
#define HAVE_ATOMIC
#endif
#if (defined(__GLIBC__) && defined(__GLIBC_PREREQ))
#if (GNUC_VERSION >= 40100 && __GLIBC_PREREQ(2, 6))
#define HAVE_ATOMIC
#endif
#endif
#endif


/*
 * Solaris (__sun) with GCC: replace the <math.h> classification macros
 * with versions built from GCC extensions, and map the BSD-style integer
 * type names onto the ones used here.
 *   isnan(x)    - true when x compares unequal to itself
 *   isfinite(x) - true when x - x is not NaN
 *   isinf(x)    - true when x is neither NaN nor finite
 * Each macro evaluates its argument exactly once through a local copy.
 */
#if defined(__sun)
#if defined(__GNUC__)
#include <math.h>
#undef isnan
#define isnan(x) \
     __extension__({ __typeof (x) __x_a = (x); \
     __builtin_expect(__x_a != __x_a, 0); })

#undef isfinite
#define isfinite(x) \
     __extension__ ({ __typeof (x) __x_f = (x); \
     __builtin_expect(!isnan(__x_f - __x_f), 1); })

#undef isinf
#define isinf(x) \
     __extension__ ({ __typeof (x) __x_i = (x); \
     __builtin_expect(!isnan(__x_i) && !isfinite(__x_i), 0); })

#define u_int uint
#define u_int32_t uint32_t
#endif /* __GNUC__ */
#endif /* __sun */


/* Test for proc filesystem: on Linux, advertise the /proc based features.
 * NOTE(review): judging by the names these gate use of /proc stat, maps,
 * smaps and the somaxconn setting -- confirm against the code testing
 * these macros. */
#ifdef __linux__
#define HAVE_PROC_STAT 1
#define HAVE_PROC_MAPS 1
#define HAVE_PROC_SMAPS 1
#define HAVE_PROC_SOMAXCONN 1
#endif

/* Test for task_info(): assumed to be available on Apple platforms. */
#if defined(__APPLE__)
#define HAVE_TASKINFO 1
#endif


#endif


================================================
FILE: dep/util/dutil.c
================================================
#include <ctype.h>
#include <stdio.h>
#include <stdlib.h>
#include <stdarg.h>
#include <string.h>
#include <unistd.h>
#include <fcntl.h>
#include <netdb.h>
#include <errno.h>

#include <sys/time.h>
#include <sys/types.h>
#include <sys/socket.h>
#include <sys/ioctl.h>

#include <netinet/in.h>
#include <netinet/tcp.h>

#ifdef HAVE_CONFIG_H
# include <config.h>
#endif

#ifdef HAVE_BACKTRACE
# include <execinfo.h>
#endif

#include <dlog.h>
#include <dutil.h>

/*
 * Definition of the mutex used by the fallback atomic_* macros in dutil.h.
 * The first two branches are intentionally empty: when the compiler
 * provides __atomic or __sync builtins no lock object is needed.
 */
/* GCC version >= 4.7 */
#if defined(__ATOMIC_RELAXED)
/* GCC version >= 4.1 */
#elif defined(HAVE_ATOMIC)
#else
/* No builtin atomics: a single process-wide mutex serialises every access. */
pthread_mutex_t atomic_locker = PTHREAD_MUTEX_INITIALIZER;
#endif

/*
 * Report a failed assertion through log_error() and, if requested,
 * terminate the process.
 *
 * cond  - text of the expression that evaluated to false
 * file  - source file containing the assertion
 * line  - line number of the assertion
 * panic - non-zero: dump a stack trace and abort(); zero: only log
 */
void
dassert(const char *cond, const char *file, int line, int panic)
{
    log_error("assert '%s' failed @ (%s, %d)", cond, file, line);

    if (!panic) {
        return;
    }

    /* Skip one frame so the trace starts at the caller of dassert(). */
    dstacktrace(1);
    abort();
}

/*
 * Log the current call stack, one frame per loga() line, numbered from 0.
 *
 * skip_count - number of innermost caller frames to leave out; the frame of
 *              dstacktrace() itself is always left out in addition.
 *
 * Compiles to an empty function when HAVE_BACKTRACE is not defined. At most
 * 64 frames are captured. Nothing is logged if symbol lookup fails.
 */
void
dstacktrace(int skip_count)
{
#ifdef HAVE_BACKTRACE
    void *frames[64];
    char **names;
    int depth, first, idx;

    depth = backtrace(frames, 64);
    names = backtrace_symbols(frames, depth);
    if (names == NULL) {
        return;
    }

    /* +1: do not report the frame of this function either */
    first = skip_count + 1;

    for (idx = first; idx < depth; idx++) {
        loga("[%d] %s", idx - first, names[idx]);
    }

    /* backtrace_symbols() returns one malloc'ed block owned by the caller */
    free(names);
#endif
}

/*
 * Write the current call stack (at most 64 frames) to the file descriptor
 * FD using backtrace_symbols_fd().
 *
 * Compiles to an empty function when HAVE_BACKTRACE is not defined.
 */
void
dstacktrace_fd(int fd)
{
#ifdef HAVE_BACKTRACE
    void *frames[64];
    int depth;

    depth = backtrace(frames, 64);

    backtrace_symbols_fd(frames, depth, fd);
#endif
}

/*
 * vsnprintf() variant that returns the number of characters actually
 * stored in BUF, not counting the trailing '\0'.
 *
 * buf  - destination buffer
 * size - capacity of BUF in bytes, including room for the '\0'
 * fmt  - printf() style format string
 * args - arguments for FMT
 *
 * Returns 0 when SIZE is 0 or when vsnprintf() reports an error, so the
 * idiom "len += _dvscnprintf(...)" never moves len backwards. On
 * truncation the result is SIZE - 1.
 *
 * See: http://lwn.net/Articles/69419/
 */
int
_dvscnprintf(char *buf, size_t size, const char *fmt, va_list args)
{
    int n;

    n = vsnprintf(buf, size, fmt, args);

    /*
     * vsnprintf() returns the length the full output would have had. With
     * SIZE == 0 nothing was stored, so report 0 instead of letting
     * "size - 1" wrap around to -1.
     */
    if (n <= 0 || size == 0) {
        return 0;
    }

    /* Compare as size_t so that a SIZE above INT_MAX is handled correctly. */
    if ((size_t)n < size) {
        return n;
    }

    /* Truncated: here size <= n <= INT_MAX, so the cast cannot overflow. */
    return (int)(size - 1);
}

/*
 * Variadic front end for _dvscnprintf(); same arguments and return value,
 * with the format arguments passed inline.
 */
int
_dscnprintf(char *buf, size_t size, const char *fmt, ...)
{
    va_list args;
    int n;

    va_start(args, fmt);
    n = _dvscnprintf(buf, size, fmt, args);
    va_end(args);

    return n;
}

/*
 * Render the unsigned value VAL in radix _BASE (2..16) as a string.
 *
 * BUF must point at the LAST byte of the caller's scratch buffer: the
 * terminating '\0' is stored there and the digits are written backwards in
 * front of it. Returns a pointer to the first digit.
 */
static char *
_safe_utoa(int _base, uint64_t val, char *buf)
{
    static const char digits[] = "0123456789abcdef";
    const uint32_t radix = (uint32_t) _base;
    char *cursor = buf;

    *cursor = '\0';

    /* Emit least-significant digit first, walking towards lower addresses. */
    do {
        cursor--;
        *cursor = digits[val % radix];
        val /= radix;
    } while (val != 0);

    return cursor;
}

/*
 * Render the signed value VAL in radix BASE as a string.
 *
 * BUF must point at the LAST byte of the caller's scratch buffer: the
 * terminating '\0' is stored there and the text is written backwards in
 * front of it. Returns a pointer to the first character.
 *
 * - base 10: negative values get a leading '-'.
 * - base 16: negative values are printed as their 64-bit two's complement
 *   pattern, i.e. always 16 hex digits.
 * - any other base: the magnitude is printed without a sign.
 *
 * All arithmetic is done on an unsigned copy, so INT64_MIN is handled
 * without signed overflow.
 */
static char *
_safe_itoa(int base, int64_t val, char *buf)
{
    static const char digits[] = "0123456789abcdef";
    const int is_neg = (val < 0);
    const uint64_t radix = (uint64_t) base;
    uint64_t mag;

    if (is_neg && base == 16) {
        /* The two's complement bit pattern is exactly what we want to show. */
        mag = (uint64_t) val;
    } else if (is_neg) {
        /* Unsigned negation is well defined, including for INT64_MIN. */
        mag = (uint64_t) 0 - (uint64_t) val;
    } else {
        mag = (uint64_t) val;
    }

    *buf = '\0';

    do {
        *--buf = digits[mag % radix];
        mag /= radix;
    } while (mag != 0);

    if (is_neg && base == 10) {
        *--buf = '-';
    }

    return buf;
}

/*
 * Consume an optional 'l' or 'll' length modifier at FMT.
 *
 * *HAVE_LONGLONG is set to 1 for 'll', to whether long is as wide as
 * long long for a single 'l', and to 0 when no modifier is present.
 * Returns a pointer to the first character after the modifier (FMT itself
 * if there was none).
 */
static const char *
_safe_check_longlong(const char *fmt, int *have_longlong)
{
    if (fmt[0] != 'l') {
        *have_longlong = 0;
        return fmt;
    }

    if (fmt[1] == 'l') {
        *have_longlong = 1;
        return fmt + 2;
    }

    /* A single 'l' only counts as 64-bit where long is that wide. */
    *have_longlong = (sizeof(long) == sizeof(long long));
    return fmt + 1;
}

/*
 * Minimal vsnprintf() replacement that relies only on va_arg and the local
 * integer-to-string helpers.
 *
 * to     - destination buffer
 * size   - capacity of TO in bytes, including room for the '\0'
 * format - format string; supports %d %i %u %x %p %s with optional
 *          'l' / 'll' modifiers, no width or precision. Any other
 *          conversion is skipped without consuming an argument.
 * ap     - arguments for FORMAT
 *
 * Output is truncated to SIZE - 1 characters and always '\0'-terminated
 * when SIZE > 0. With SIZE == 0 the buffer is not touched and 0 is
 * returned. Returns the number of characters stored, not counting the
 * terminating '\0'.
 */
int
_safe_vsnprintf(char *to, size_t size, const char *format, va_list ap)
{
    char *start = to;
    char *end;

    /* No room even for the terminator: do not write anything. */
    if (size == 0) {
        return 0;
    }
    end = start + size - 1;     /* last byte is reserved for '\0' */

    for (; *format; ++format) {
        int have_longlong = 0;

        if (*format != '%') {
            if (to == end) {    /* end of buffer */
                break;
            }
            *to++ = *format;    /* copy ordinary char */
            continue;
        }
        ++format;               /* skip '%' */

        format = _safe_check_longlong(format, &have_longlong);

        /*
         * A format ending in "%" or "%l" leaves us on the terminator; stop
         * here so the loop increment cannot step past the end of FORMAT.
         */
        if (*format == '\0') {
            break;
        }

        switch (*format) {
        case 'd':
        case 'i':
        case 'u':
        case 'x':
        case 'p':
            {
                int64_t ival = 0;
                uint64_t uval = 0;
                char buff[22];
                char *val_as_str;
                const int base = (*format == 'x' || *format == 'p') ? 16 : 10;

                /* Pointers are fetched as 64-bit exactly when they are. */
                if (*format == 'p') {
                    have_longlong = (sizeof(void *) == sizeof(uint64_t));
                }

                if (have_longlong) {
                    if (*format == 'u') {
                        uval = va_arg(ap, uint64_t);
                    } else {
                        ival = va_arg(ap, int64_t);
                    }
                } else {
                    if (*format == 'u') {
                        uval = va_arg(ap, uint32_t);
                    } else {
                        ival = va_arg(ap, int32_t);
                    }
                }

                /* The helpers fill buff backwards from its last byte. */
                if (*format == 'u') {
                    val_as_str = _safe_utoa(base, uval,
                                            &buff[sizeof(buff) - 1]);
                } else {
                    val_as_str = _safe_itoa(base, ival,
                                            &buff[sizeof(buff) - 1]);
                }

                /* Strip off "ffffffff" if we have 'x' format without 'll' */
                if (*format == 'x' && !have_longlong && ival < 0) {
                    val_as_str += 8;
                }

                while (*val_as_str && to < end) {
                    *to++ = *val_as_str++;
                }
                continue;
            }
        case 's':
            {
                const char *val = va_arg(ap, char *);

                if (!val) {
                    val = "(null)";
                }
                while (*val && to < end) {
                    *to++ = *val++;
                }
                continue;
            }
        default:
            /* Unsupported conversion: dropped from the output. */
            break;
        }
    }

    *to = 0;
    return (int)(to - start);
}

/*
 * Variadic front end for _safe_vsnprintf(): formats FMT and its arguments
 * into TO (capacity N bytes) and returns whatever _safe_vsnprintf() returns.
 */
int
_safe_snprintf(char *to, size_t n, const char *fmt, ...)
{
    va_list ap;
    int written;

    va_start(ap, fmt);
    written = _safe_vsnprintf(to, n, fmt, ap);
    va_end(ap);

    return written;
}

/*
 * Current wall-clock time, in microseconds since the Epoch, as reported by
 * gettimeofday(). If gettimeofday() fails the error is passed to
 * log_error() and -1 is returned.
 */
long long
dusec_now(void)
{
    struct timeval tv;

    if (gettimeofday(&tv, NULL) < 0) {
        log_error("gettimeofday failed: %s", strerror(errno));
        return -1;
    }

    /* Widen before multiplying so 32-bit time_t builds do not overflow. */
    return (int64_t)tv.tv_sec * 1000000LL + (int64_t)tv.tv_usec;
}

/*
 * Current wall-clock time in milliseconds since the Epoch, derived from
 * dusec_now(). Note that a dusec_now() failure value of -1 becomes 0 here
 * because the integer division truncates towards zero.
 */
long long
dmsec_now(void)
{
    long long usec = dusec_now();

    return usec / 1000LL;
}

/*
 * Current wall-clock time in whole seconds since the Epoch, derived from
 * dusec_now(). Note that a dusec_now() failure value of -1 becomes 0 here
 * because the integer division truncates towards zero.
 */
long long
dsec_now(void)
{
    long long usec = dusec_now();

    return usec / 1000000LL;
}

/*
 * Lower-case C for case-insensitive comparison. tolower() is only defined
 * for values representable as unsigned char (or EOF), so a negative value
 * coming from a signed char is returned unchanged instead of being passed on.
 */
static int
string_match_tolower(int c)
{
    return (c < 0) ? c : tolower(c);
}

/*
 * Glob-style pattern matching.
 *
 * pattern, patternLen - pattern bytes and their count; need not be
 *                       '\0'-terminated
 * string, stringLen   - subject bytes and their count; need not be
 *                       '\0'-terminated
 * nocase              - non-zero for case-insensitive comparison
 *
 * Supported syntax: '*' (any run of characters, possibly empty), '?' (any
 * single character), '[...]' character classes with '^' negation, 'a-z'
 * ranges and '\' escapes, and '\x' to match x literally.
 *
 * Returns 1 if the whole STRING matches the whole PATTERN, 0 otherwise.
 * Neither buffer is ever read beyond its stated length.
 */
int string_match_len(const char *pattern, int patternLen,
        const char *string, int stringLen, int nocase)
{
    while (patternLen > 0) {
        switch (pattern[0]) {
        case '*':
            /* Collapse runs of '*'; look ahead only inside the pattern. */
            while (patternLen > 1 && pattern[1] == '*') {
                pattern++;
                patternLen--;
            }
            if (patternLen == 1) {
                return 1; /* match */
            }
            /* Try the rest of the pattern at every remaining position. */
            while (stringLen > 0) {
                if (string_match_len(pattern + 1, patternLen - 1,
                                     string, stringLen, nocase)) {
                    return 1; /* match */
                }
                string++;
                stringLen--;
            }
            return 0; /* no match */
        case '?':
            if (stringLen <= 0) {
                return 0; /* no match */
            }
            string++;
            stringLen--;
            break;
        case '[':
        {
            int not, match;

            /* A class always consumes one character of the string. */
            if (stringLen <= 0) {
                return 0; /* no match */
            }

            pattern++;
            patternLen--;
            not = (patternLen > 0 && pattern[0] == '^');
            if (not) {
                pattern++;
                patternLen--;
            }
            match = 0;
            for (;;) {
                if (patternLen == 0) {
                    /*
                     * Unterminated class: step back so the common
                     * "advance past this token" code below lands exactly
                     * on the end of the pattern.
                     */
                    pattern--;
                    patternLen++;
                    break;
                } else if (pattern[0] == '\\' && patternLen >= 2) {
                    pattern++;
                    patternLen--;
                    if (pattern[0] == string[0]) {
                        match = 1;
                    }
                } else if (pattern[0] == ']') {
                    break;
                } else if (patternLen >= 3 && pattern[1] == '-') {
                    int start = pattern[0];
                    int end = pattern[2];
                    int c = string[0];

                    if (start > end) {
                        int t = start;
                        start = end;
                        end = t;
                    }
                    if (nocase) {
                        start = string_match_tolower(start);
                        end = string_match_tolower(end);
                        c = string_match_tolower(c);
                    }
                    pattern += 2;
                    patternLen -= 2;
                    if (c >= start && c <= end) {
                        match = 1;
                    }
                } else {
                    if (!nocase) {
                        if (pattern[0] == string[0]) {
                            match = 1;
                        }
                    } else {
                        if (string_match_tolower(pattern[0]) ==
                            string_match_tolower(string[0])) {
                            match = 1;
                        }
                    }
                }
                pattern++;
                patternLen--;
            }
            if (not) {
                match = !match;
            }
            if (!match) {
                return 0; /* no match */
            }
            string++;
            stringLen--;
            break;
        }
        case '\\':
            /* A trailing backslash stands for itself. */
            if (patternLen >= 2) {
                pattern++;
                patternLen--;
            }
            /* fall through */
        default:
            if (stringLen <= 0) {
                return 0; /* no match */
            }
            if (!nocase) {
                if (pattern[0] != string[0]) {
                    return 0; /* no match */
                }
            } else {
                if (string_match_tolower(pattern[0]) !=
                    string_match_tolower(string[0])) {
                    return 0; /* no match */
                }
            }
            string++;
            stringLen--;
            break;
        }
        pattern++;
        patternLen--;
        if (stringLen == 0) {
            /* Trailing '*'s still match the now-empty remainder. */
            while (patternLen > 0 && *pattern == '*') {
                pattern++;
                patternLen--;
            }
            break;
        }
    }
    if (patternLen == 0 && stringLen == 0) {
        return 1;
    }
    return 0;
}

/*
 * Glob-match two '\0'-terminated strings: measures both with strlen() and
 * forwards to string_match_len(). Returns its result (1 match, 0 no match).
 */
int string_match(const char *pattern, const char *string, int nocase) {
    int pattern_len = strlen(pattern);
    int string_len = strlen(string);

    return string_match_len(pattern, pattern_len, string, string_len, nocase);
}


================================================
FILE: dep/util/dutil.h
================================================
#ifndef _DUTIL_H_
#define _DUTIL_H_

#include <stdarg.h>

#include <dspecialconfig.h>

/* Evaluate x and discard the result, e.g. to mark a parameter as used. */
#define UNUSED(x) (void)(x)

/* Line terminators: LF and CR as byte values, CRLF as a string literal. */
#define LF                  (uint8_t) 10
#define CR                  (uint8_t) 13
#define CRLF                "\x0d\x0a"
#define CRLF_LEN            (sizeof("\x0d\x0a") - 1)

/* Element count of a true array (not valid for pointers). */
#define NELEMS(a)           ((sizeof(a)) / sizeof((a)[0]))

/* NOTE: MIN, MAX and SQUARE evaluate their arguments more than once. */
#define MIN(a, b)           ((a) < (b) ? (a) : (b))
#define MAX(a, b)           ((a) > (b) ? (a) : (b))

/*
 * VAR and STDDEV yield 0.0 for fewer than two samples. Presumably s is the
 * sum of the samples, s2 the sum of their squares and n the sample count;
 * verify against callers. STDDEV expands to a sqrt() call, so users of it
 * need <math.h>.
 */
#define SQUARE(d)           ((d) * (d))
#define VAR(s, s2, n)       (((n) < 2) ? 0.0 : ((s2) - SQUARE(s)/(n)) / ((n) - 1))
#define STDDEV(s, s2, n)    (((n) < 2) ? 0.0 : sqrt(VAR((s), (s2), (n))))

/*
 * Wrappers for defining custom assert based on whether macro
 * HAVE_ASSERT_PANIC or HAVE_ASSERT_LOG was defined at the moment
 * ASSERT was called.
 */
/* HAVE_ASSERT_PANIC: a failed ASSERT calls dassert() with panic = 1. */
#ifdef HAVE_ASSERT_PANIC

#define ASSERT(_x) do {                         \
    if (!(_x)) {                                \
        dassert(#_x, __FILE__, __LINE__, 1);  \
    }                                           \
} while (0)

#define NOT_REACHED() ASSERT(0)

/* HAVE_ASSERT_LOG: a failed ASSERT calls dassert() with panic = 0. */
#elif HAVE_ASSERT_LOG

#define ASSERT(_x) do {                         \
    if (!(_x)) {                                \
        dassert(#_x, __FILE__, __LINE__, 0);  \
    }                                           \
} while (0)

#define NOT_REACHED() ASSERT(0)

/* Neither: both macros expand to nothing and _x is never evaluated. */
#else

#define ASSERT(_x)

#define NOT_REACHED()

#endif

/* Log a failed assertion; with panic != 0 also dump a stack trace and abort(). */
void dassert(const char *cond, const char *file, int line, int panic);
/* Log the call stack, omitting skip_count caller frames plus its own frame. */
void dstacktrace(int skip_count);
/* Write the call stack to file descriptor fd. */
void dstacktrace_fd(int fd);

/* Back ends of the dscnprintf() / dvscnprintf() macros defined below. */
int _dscnprintf(char *buf, size_t size, const char *fmt, ...);
int _dvscnprintf(char *buf, size_t size, const char *fmt, va_list args);
/* Wall-clock time since the Epoch in microseconds, milliseconds, seconds. */
long long dusec_now(void);
long long dmsec_now(void);
long long dsec_now(void);

/*
 * A (very) limited version of snprintf
 * @param   to   Destination buffer
 * @param   n    Size of destination buffer
 * @param   fmt  printf() style format string
 * @returns Number of bytes written, excluding the terminating '\0'
 * Supports 'd' 'i' 'u' 'x' 'p' 's' conversion
 * Supports 'l' and 'll' modifiers for integral types
 * Does not support any width/precision
 * Implemented with simplicity, and async-signal-safety in mind
 */
int _safe_vsnprintf(char *to, size_t size, const char *format, va_list ap);
int _safe_snprintf(char *to, size_t n, const char *fmt, ...);

/* Convenience wrappers that cast the buffer to char * and the size to size_t. */
#define dsafe_snprintf(_s, _n, ...)       \
    _safe_snprintf((char *)(_s), (size_t)(_n), __VA_ARGS__)

#define dsafe_vsnprintf(_s, _n, _f, _a)   \
    _safe_vsnprintf((char *)(_s), (size_t)(_n), _f, _a)

/*
 * snprintf(s, n, ...) will write at most n - 1 of the characters printed into
 * the output string; the nth character then gets the terminating `\0'; if
 * the return value is greater than or equal to the n argument, the string
 * was too short and some of the printed characters were discarded; the output
 * is always null-terminated.
 *
 * Note that the return value of snprintf() is always the number of characters
 * that would be printed into the output string if n were unlimited, not
 * including the trailing `\0' used to end output.
 *
 * scnprintf(s, n, ...) is same as snprintf() except, it returns the number
 * of characters printed into the output string not including the trailing '\0'
 */
/* snprintf() with the buffer cast to char * and the size cast to size_t. */
#define dsnprintf(_s, _n, ...)        \
    snprintf((char *)(_s), (size_t)(_n), __VA_ARGS__)

/* As dsnprintf(), but returns the count of characters actually stored. */
#define dscnprintf(_s, _n, ...)       \
    _dscnprintf((char *)(_s), (size_t)(_n), __VA_ARGS__)

/* va_list counterpart of dsnprintf(). */
#define dvsnprintf(_s, _n, _f, _a)    \
    vsnprintf((char *)(_s), (size_t)(_n), _f, _a)

/* va_list counterpart of dscnprintf(). */
#define dvscnprintf(_s, _n, _f, _a)   \
    _dvscnprintf((char *)(_s), (size_t)(_n), _f, _a)

/* strftime() with casts applied; the size_t result is narrowed to int. */
#define dstrftime(_s, _n, fmt, tm)        \
    (int)strftime((char *)(_s), (size_t)(_n), fmt, tm)

/*
 * Glob-style matching ('*', '?', '[...]', '\' escapes). Returns 1 on a full
 * match and 0 otherwise; nocase != 0 compares case-insensitively.
 * string_match() is the strlen()-based form for '\0'-terminated strings.
 */
int string_match_len(const char *pattern, int patternLen, const char *string, int stringLen, int nocase);
int string_match(const char *pattern, const char *string, int nocase);


/*
 * Atomic API
 *
 * atomic_add/atomic_sub/atomic_set take the variable itself (not its
 * address) as _value; atomic_get additionally takes a pointer _v that
 * receives the value read. One of three implementations is selected at
 * compile time and its name is exposed as the string ATOMIC_LOCK_TYPE.
 *
 * NOTE: with the builtin implementations atomic_add/atomic_sub are
 * expressions yielding the new value, while the mutex fallback expands to
 * statements with no value, so portable callers must not use the result.
 */
/* GCC version >= 4.7 */
#if defined(__ATOMIC_RELAXED)
/* __atomic builtins, all using relaxed memory ordering. */
#define atomic_add(_value, _n) __atomic_add_fetch(&_value, (_n), __ATOMIC_RELAXED)
#define atomic_sub(_value, _n) __atomic_sub_fetch(&_value, (_n), __ATOMIC_RELAXED)
#define atomic_set(_value, _n) __atomic_store_n(&_value, (_n), __ATOMIC_RELAXED)
#define atomic_get(_value, _v) do {                 \
    __atomic_load(&_value, _v, __ATOMIC_RELAXED);   \
} while(0)

#define ATOMIC_LOCK_TYPE "__ATOMIC_RELAXED"
/* GCC version >= 4.1 */
#elif defined(HAVE_ATOMIC)
/* Legacy __sync builtins; the read is implemented as an atomic add of 0. */
#define atomic_add(_value, _n) __sync_add_and_fetch(&_value, (_n))
#define atomic_sub(_value, _n) __sync_sub_and_fetch(&_value, (_n))
#define atomic_set(_value, _n) __sync_lock_test_and_set(&_value, (_n))
#define atomic_get(_value, _v) do {                 \
    (*_v) = __sync_add_and_fetch(&_value, 0);       \
} while(0)

#define ATOMIC_LOCK_TYPE "HAVE_ATOMIC"
#else
/* Fallback: every operation takes the single global mutex atomic_locker. */
extern pthread_mutex_t atomic_locker;

#define atomic_add(_value, _n) do {         \
    pthread_mutex_lock(&atomic_locker);     \
    _value += (_n);                         \
    pthread_mutex_unlock(&atomic_locker);   \
} while(0)

#define atomic_sub(_value, _n) do {         \
    pthread_mutex_lock(&atomic_locker);     \
    _value -= (_n);                         \
    pthread_mutex_unlock(&atomic_locker);   \
} while(0)

#define atomic_set(_value, _n) do {         \
    pthread_mutex_lock(&atomic_locker);     \
    _value = (_n);                          \
    pthread_mutex_unlock(&atomic_locker);   \
} while(0)

#define atomic_get(_value, _v) do {         \
    pthread_mutex_lock(&atomic_locker);     \
    (*_v) = _value;                         \
    pthread_mutex_unlock(&atomic_locker);   \
} while(0)

#define ATOMIC_LOCK_TYPE "pthread_mutex_lock"
#endif

#endif


================================================
FILE: m4/.gitignore
================================================
# Ignore everything
*

# Except me
!.gitignore


================================================
FILE: notes/c-styleguide.txt
================================================
- No literal tabs. Expand tabs to 4 spaces.
- Indentation is 4 spaces.
- No more than 3 levels of indentation, otherwise you should think about
  refactoring your code.
- Use one statement per line.
- Make sure that your editor does not leave space at the end of the line.
- snake_case for variable, function and file names.
- Use your own judgment when naming variables and functions. Be as Spartan
  as possible. Eg: Using name like this_variable_is_a_temporary_counter
  will usually be frowned upon.
- Don’t use local variables or parameters that shadow global identifiers.
  GCC’s ‘-Wshadow’ option can help you to detect this problem.

- Avoid using int, char, short, long. Instead use int8_t uint8_t, int16_t,
  uint16_t, int32_t, uint32_t, int64_t, uint64_t, which are available in
  <stdint.h>. However, when interfacing with system calls and libraries
  you cannot get away from using int and char.
- Use bool for boolean variables. You have to include <stdbool.h>
- Avoid using a bool as type for struct member names. Instead use unsigned
  1-bit bit field. Eg:
  struct foo {
      unsigned is_bar:1;
  };
- Always use size_t type when dealing with sizes of objects or memory ranges.
- Your code should be 64-bit and 32-bit friendly. Bear in mind problems
  of printing, comparisons, and structure alignment. You have to include
  <inttypes.h> to get generic format specifier macros for printing.

- 80 column line limit.
- If you have to wrap a long statement (> 80 column), put the operator at the
  end of the line and indent the next line at the same column as the arguments
  in the previous column. Eg:
    while (cnt < 20 && this_variable_name_is_too_long &&
           ep != NULL) {
        z = a + really + long + statement + that + needs + three + lines +
            gets + indented + on + the + same + column + as + the +
            previous + column
    }

    and:

    int a = function(param_a, param_b, param_c, param_d, param_e, param_f,
                     param_g, param_h, param_i, param_j, param_k, param_l);

- Always use braces for all conditional blocks (if, switch, for, while, do).
  This holds good even for single statement conditional blocks. Eg:
    if (cond) {
        stmt;
    }
- Placement of braces for non-function statement blocks - put opening brace
  last on the line and closing brace first. Eg:
    if (x is true) {
        we do y
    }
- Placement of brace for functions - put the opening brace at the beginning
  of the next line and closing brace first. This is useful because several
  tools look for opening brace in column one to find beginning of C
  functions. Eg:
int
function(int x)
{
    body of the function
}

- Closing brace is empty on a line of its own, except in cases where it is
  followed by a continuation of the same statement, i.e. a "while" in a
  do-statement or an "else" in an if-statement, like this:
    do {
        body of do-loop
    } while (condition);

    and,

    if (x == y) {
        ..
    } else if (x > y) {
        ...
    } else {
        ....
    }

- Column align switch keyword and the corresponding case/default keyword. Eg:
    switch (alphabet) {
    case 'a':
    case 'b':
        printf("I am a or b\n");
        break;

    default:
        break;
    }

- Forever loops are done with for, and not while. Eg:
    for (;;) {
        stmt;
    }

- Don't use a space after a function name.
- Do not needlessly surround the return expression with parentheses.
- Use space after keywords. Exceptions are sizeof, typeof, alignof and
  __attribute__, which look like functions.
- Do not add spaces around (inside) parenthesized expressions.
    s = sizeof( sizeof(*p) ); /* bad example */
    s = sizeof(sizeof(*p));    /* good example */
- Casts should not be followed by space. Eg:
  int q = *(int *)&p
- There is no need to type cast when assigning a void pointer to a non-void
  pointer, or vice versa.
- Avoid using goto statements. However there are some exceptions to this rule
  when a single goto label within a function and one or more goto statements
  come in handy when a function exits from multiple locations and some common
  work such as cleanup has to be done. Eg:
int
fun(void)
{
    int result = 0;
    char *buffer;

    buffer = malloc(1024);
    if (buffer == NULL) {
        return -1;
    }

    if (condition1) {
        while (loop1) {
            ...
        }
        result = 1;
        goto out;
    }

    ...
out:
    free(buffer);
    return result;
}
- When declaring pointer data, use '*' adjacent to the data name and not
  adjacent to the type name. Eg:
    int
    function(int *p)
    {
        char *p;
        <body of the function>
    }
- Use one space around (on each side of) most binary and ternary operators,
  such as any of these:
    =  +  -  <  >  *  /  %  |  &  ^  <=  >=  ==  !=  ?  :
  but no space after unary operators:
    &  *  +  -  ~  !  sizeof typeof alignof  __attribute__  defined
  no space before the postfix increment & decrement unary operators:
    ++  --
  and no space around the '.' and "->" structure member operators.

- 0 and NULL; use 0 for integers, 0.0 for doubles, NULL for pointers, and
  '\0' for chars.
- Test pointers against NULL. E.g, use:
    if (p == NULL)

    not:

    !(p)

- Do not use ! for tests unless it is a boolean. E.g. use:
    if (*p == '\0')

    not:

    if (!*p)

- Don't use assignments inside if or while-conditions. E.g, use:

    struct foo *foo;
    foo = malloc(sizeof(*foo));
    if (foo == NULL) {
        return -1;
    }

    not:

    struct foo *foo;
    if ((foo = malloc(sizeof(*foo))) == NULL) {
        return -1;
    }

- Don't ever use typedef for structure types. Typedefs are problematic
  because they do not properly hide their underlying type; for example you
  need to know if the typedef is the structure itself or a pointer to the
  structure. In addition they must be declared exactly once, whereas an
  incomplete structure type can be mentioned as many times as necessary.
  Typedefs are difficult to use in stand-alone header files: the header
  that defines the typedef must be included before the header that uses it,
  or by the header that uses it (which causes namespace pollution), or
  there must be a back-door mechanism for obtaining the typedef.
- The only exception for using a typedef is when you are defining a type
  for a function pointer or a type for an enum. Eg:

  typedef void (*foo_handler_t)(int, void *);

  or:

  typedef enum types {
      TYPE_1,
      TYPE_2
  } types_t;

- Use just one variable declaration per line when variables are part of a
  struct. This leaves you room for a small comment on each item, explaining
  its use. Declarations should also be aligned. Eg, use:

  struct foo {
    int      *foo_a;   /* comment for foo_a */
    int      foo_b;    /* comment for foo_b */
    unsigned foo_c:1;  /* comment for foo_c */
  };

  and not:

  struct foo {
    int *foo_a, foo_b;
    unsigned foo_c:1;
  };

- For variable declaration outside a struct, either collect all the
  declarations of the same type on a single line, or use one variable
  per line if the variables purpose needs to be commented. Eg:
  char *a, *b, c;

  or:

  char *a, *b;
  char c;       /* comments for c */

- Avoid magic numbers because no-one has a clue (including the author) of
  what it means after a month.

- Function definitions should start the name of the function in column
  one. This is useful because it makes searching for function definitions
  fairly trivial. Eg:
static char *
concat(char *s1, char *s2)
{
  body of the function
}

- Function and variables local to a file should be static.
- Separate two successive functions with one blank line.
- Include parameter names with their datatypes in function declaration. Eg:
void function(int param);

- Functions should be short and sweet, and do just one thing. They should
  fit on one or two screenfuls of text (80 x 24 screen size), and do one
  thing and do that well.
  The maximum length of a function is inversely proportional to the
  complexity and indentation level of that function. So, if you have a
  conceptually simple function that is just one long (but simple)
  case-statement, where you have to do lots of small things for a lot of
  different cases, it's OK to have a longer function.
  Another measure of the function is the number of local variables. They
  shouldn't exceed 5-10, or you're doing something wrong. Re-think the
  function, and split it into smaller pieces. A human brain can
  generally easily keep track of about 7 different things, anything more
  and it gets confused. You know you're brilliant, but maybe you'd like
  to understand what you did 2 weeks from now.
- Use const for function parameters passed by reference, if the passed
  pointer has no side effect.

- C style comments only. Don't use // for single line comments. Instead
  use /* ... */ style.
- For multi-line comments use the following style
    /*
     * This is the preferred style for multi-line
     * comments in the Linux kernel source code.
     * Please use it consistently.
     *
     * Description:  A column of asterisks on the left side,
     * with beginning and ending almost-blank lines.
     */

- To comment out a block of code spanning several lines, use the preprocessor
  directive "#if 0 ... #endif"

- Please write a brief comment at the start of each source file, with the
  file name and a line or two about the overall purpose of the file.

- All major functions should have comments describing what they do at the
  head of the function. Avoid putting comments in the function body unless
  absolutely needed. If possible, add a comment on what sorts of arguments
  the function gets, and what the possible values of arguments mean and
  what they are used for and the significance of return value if there is
  one. It is not necessary to duplicate in words the meaning of the C
  argument declarations, if a C type is being used in its customary fashion.
  If there is anything nonstandard about its use (such as an argument of
  type char * which is really the address of the second character of a
  string, not the first), or any possible values that would not work the
  way one would expect (such as, that strings containing newlines are not
  guaranteed to work), be sure to say so. Eg:

/*
 * Try to acquire a physical address lock while a pmap is locked. If we
 * fail to trylock we unlock and lock the pmap directly and cache the
 * locked pa in *locked. The caller should then restart their loop in case
 * the virtual to physical mapping has changed.
 *
 * Returns 0 on success and -1 on failure.
 */
int
vm_page_pa_tryrelock(pmap_t pmap, vm_paddr_t pa, vm_paddr_t *locked)
{
    ...

- The comment on a function is much clearer if you use the argument names
  to speak about the argument values. The variable name itself should be
  lower case, but write it in upper case when you are speaking about the
  value rather than the variable itself. Thus, “the inode number NODE_NUM”
  rather than “an inode”.

- Every struct definition should have an accompanying comment that
  describes what it is for and how it should be used.

- Finally, while comments are absolutely important to keep the code readable,
  remember that the best code is self-documenting. Giving sensible names to
  types and variables is much better than using obscure names that you must
  then explain through comments.

- Recommend using UPPERCASE for macro names. However, sometimes using
  lowercase for macro names makes sense when macros masquerade as well-known
  function calls. Eg, it makes sense to write the wrapper for the
  standard free() function in lowercase to keep the readability
  consistent:

#define my_free(_p) do {    \
    free(_p);               \
    (_p) = NULL;            \
} while (0)

- Use enums when defining more than one related constants. All enumeration
  values are in UPPERCASE.
- Avoid macros as much as possible and use inline functions, enums and const
  variables wherever you can.
- For macros encapsulating compound statements, right justify the backslashes
  and enclose it in do { ... } while (0)
- For parameterized macros, all the parameters used in the macro body must
  be surrounded by parentheses. Eg:
  #define ADD_1(_x) ((_x) + 1)

- Use sizeof(varname) instead of sizeof(type) whenever possible. Eg:
  char *p;
  p = malloc(sizeof(*p));   /* good example */
  p = malloc(sizeof(char)); /* bad example */

- All variables should be declared at the beginning of a scope block {..}.
  It is even preferred to declare all variables at the beginning of the
  function so that all the local variable declarations are in one place and
  we can see the comprehensive list in one glance.
- Global structs should be declared at the top of the file in which they
  are used, or in separate header files if they are used in multiple
  source files.
- Declarations of external functions and functions to appear later in the
  source file should all go in one place near the beginning of the file,
  somewhere before the first function definition in the file or else
  should go in a header file.
- Use of extern should be considered as evil, if it is used in header files
  to reference global variables.
- Don’t put extern declarations inside functions.

- Usually every *.c file should have an associated *.h file. There are some
  exceptions to this rule, such as unit tests and small *.c files containing
  just the main() function.
- Every header file in the source code must have preprocessor conditional
  to prevent the header file from being scanned multiple times and avoiding
  mutual dependency cycles. Alternatively you can use #pragma once directive,
  as it avoids name clashes and increases the compile speed. Eg, for a
  header file named foo.h, the entire contents of the header file must be
  between the guard macros as follows:

#ifndef _FOO_H_
#define _FOO_H_
...
#endif /* _FOO_H_ */

Or,

#pragma once
#ifndef _FOO_H_
#define _FOO_H_
...
#endif /* _FOO_H_ */

- Don't use #include when a forward declaration would suffice.
- Functions defined in header files should be static inline.

- Don’t make the program ugly just to placate GCC when extra warnings options
  such as ‘-Wconversion’ or ‘-Wundef’ are used. These options can help in
  finding bugs, but they can also generate so many false alarms that
  it hurts readability to silence them with unnecessary casts, wrappers, and
  other complications.

- Conditional compilation: when supporting configuration options already
  known when building your program we prefer using if (... ) over conditional
  compilation, as in the former case the compiler is able to perform more
  extensive checking of all possible code paths. Eg, use:

  if (HAS_FOO)
    ...
  else
    ...

instead of:

  #ifdef HAS_FOO
    ...
  #else
    ...
  #endif

  A modern compiler such as GCC will generate exactly the same code in both
  cases and of course, the former method assumes that HAS_FOO is defined as
  either 0 or 1.

- Finally, rules are rules. Sometimes they are sensible and sometimes not
  and regardless of your preference, we would like you to follow them.
  A project is easier to follow if all project contributors follow the style
  rules so that they can all read and understand everyone's code easily. But
  remember, like all good rules, there are exceptions where it makes sense not
  to be too rigid on the grounds of common sense and consistency!


================================================
FILE: notes/debug.txt
================================================
- strace
  strace -o strace.txt -ttT -s 1024 -p `pgrep vire`

- libyaml (yaml-0.1.4)

  - yaml tokens:

  0  YAML_NO_TOKEN,
  1  YAML_STREAM_START_TOKEN,
  2  YAML_STREAM_END_TOKEN,
  3  YAML_VERSION_DIRECTIVE_TOKEN,
  4  YAML_TAG_DIRECTIVE_TOKEN,
  5  YAML_DOCUMENT_START_TOKEN,
  6  YAML_DOCUMENT_END_TOKEN,
  7  YAML_BLOCK_SEQUENCE_START_TOKEN,
  8  YAML_BLOCK_MAPPING_START_TOKEN,
  9  YAML_BLOCK_END_TOKEN,
  10 YAML_FLOW_SEQUENCE_START_TOKEN,
  11 YAML_FLOW_SEQUENCE_END_TOKEN,
  12 YAML_FLOW_MAPPING_START_TOKEN,
  13 YAML_FLOW_MAPPING_END_TOKEN,
  14 YAML_BLOCK_ENTRY_TOKEN,
  15 YAML_FLOW_ENTRY_TOKEN,
  16 YAML_KEY_TOKEN,
  17 YAML_VALUE_TOKEN,
  18 YAML_ALIAS_TOKEN,
  19 YAML_ANCHOR_TOKEN,
  20 YAML_TAG_TOKEN,
  21 YAML_SCALAR_TOKEN

  - yaml events

  0  YAML_NO_EVENT,
  1  YAML_STREAM_START_EVENT,
  2  YAML_STREAM_END_EVENT,
  3  YAML_DOCUMENT_START_EVENT,
  4  YAML_DOCUMENT_END_EVENT,
  5  YAML_ALIAS_EVENT,
  6  YAML_SCALAR_EVENT,
  7  YAML_SEQUENCE_START_EVENT,
  8  YAML_SEQUENCE_END_EVENT,
  9  YAML_MAPPING_START_EVENT,
  10 YAML_MAPPING_END_EVENT

- sys/queue.h

  queue.h is a generic linked list library adapted from BSD. It has three
  macro knobs that are useful for debugging:

  - QUEUE_MACRO_SCRUB nullifies links (next and prev pointers) of deleted
    elements and catches cases where we are attempting to do operations
    on an element that has already been unlinked.
  - QUEUE_MACRO_TRACE keeps track of __FILE__ and __LINE__ of last two
    updates to the list data structure.
  - QUEUE_MACRO_ASSERT verifies the sanity of list data structure on every
    operation.

- valgrind
  valgrind --tool=memcheck --leak-check=yes <program>

- Core dump
  ulimit -c unlimited

- Generate ENOMEM to test "Out of Memory"
  ulimit -m <size>    # limit maximum memory size
  ulimit -v <size>    # limit virtual memory

- get nutcracker stats
  printf "" | socat  - TCP:localhost:22222 | tee stats.txt
  printf "" | nc localhost 22222 | python -mjson.tool

- Signalling and Logging
  SIGTTIN - To up the log level
  SIGTTOU - To down the log level
  SIGHUP  - To reopen log file

- Error codes:
  http://www.cs.utah.edu/dept/old/texinfo/glibc-manual-0.02/library_2.html
  /usr/include/asm-generic/errno-base.h
  /usr/include/asm-generic/errno.h

- epoll (linux)

  union epoll_data {
      void *ptr;
      int fd;
      uint32_t u32;
      uint64_t u64;
  };

  struct epoll_event {
      uint32_t          events;  /* epoll events */
      struct epoll_data data;    /* user data variable */
  };

  /* events */
  EPOLLIN       = 0x001,
  EPOLLPRI      = 0x002,
  EPOLLOUT      = 0x004,
  EPOLLERR      = 0x008,
  EPOLLHUP      = 0x010,
  EPOLLRDNORM   = 0x040,
  EPOLLRDBAND   = 0x080,
  EPOLLWRNORM   = 0x100,
  EPOLLWRBAND   = 0x200,
  EPOLLMSG      = 0x400,
  EPOLLRDHUP    = 0x2000,
  EPOLLONESHOT  = (1 << 30),
  EPOLLET       = (1 << 31)

  /* opcodes */
  EPOLL_CTL_ADD = 1 /* add a file descriptor to the interface */
  EPOLL_CTL_DEL = 2 /* remove a file descriptor from the interface */
  EPOLL_CTL_MOD = 3 /* change file descriptor epoll_event structure */

- kqueue (bsd)

  struct kevent {
      uintptr_t   ident;    /* identifier for this event */
      int16_t     filter;   /* filter for event */
      uint16_t    flags;    /* general flags */
      uint32_t    fflags;   /* filter-specific flags */
      intptr_t    data;     /* filter-specific data */
      void        *udata;   /* opaque user data identifier */
  };

  /* flags / events */
  EV_ADD        = 0x0001    /* action - add event to kq (implies enable) */
  EV_DELETE     = 0x0002    /* action - delete event from kq */
  EV_ENABLE     = 0x0004    /* action - enable event */
  EV_DISABLE    = 0x0008    /* action - disable event (not reported) */
  EV_RECEIPT    = 0x0040    /* action - force EV_ERROR on success, data == 0 */

  EV_ONESHOT    = 0x0010    /* flags - only report one occurrence */
  EV_CLEAR      = 0x0020    /* flags - clear event state after reporting */
  EV_DISPATCH   = 0x0080    /* flags - disable event after reporting */
  EV_SYSFLAGS   = 0xF000    /* flags - reserved by system */
  EV_FLAG0      = 0x1000    /* flags - filter-specific flag */
  EV_FLAG1      = 0x2000    /* flags - filter-specific flag */

  EV_EOF        = 0x8000    /* returned values - EOF detected */
  EV_ERROR      = 0x4000    /* returned values - error, data contains errno */

  /* filters */
  EVFILT_READ       (-1)    /* readable */
  EVFILT_WRITE      (-2)    /* writable */
  EVFILT_AIO        (-3)    /* attached to aio requests */
  EVFILT_VNODE      (-4)    /* attached to vnodes */
  EVFILT_PROC       (-5)    /* attached to struct proc */
  EVFILT_SIGNAL     (-6)    /* attached to struct proc */
  EVFILT_TIMER      (-7)    /* timers */
  EVFILT_MACHPORT   (-8)    /* mach portsets */
  EVFILT_FS         (-9)    /* filesystem events */
  EVFILT_USER       (-10)   /* user events */
  EVFILT_VM         (-12)   /* virtual memory events */

  EV_CLEAR behaves like EPOLLET because it resets the event after it is
  returned; without this flag, the event would be repeatedly returned.

- poll (unix)

  POLLIN       0x001    /* there is data to read */
  POLLPRI      0x002    /* there is urgent data to read */
  POLLOUT      0x004    /* writing now will not block */

  POLLRDNORM   0x040    /* normal data may be read */
  POLLRDBAND   0x080    /* priority data may be read */
  POLLWRNORM   0x100    /* writing now will not block */
  POLLWRBAND   0x200    /* priority data may be written */

  POLLMSG      0x400
  POLLREMOVE  0x1000
  POLLRDHUP   0x2000

  POLLERR      0x008    /* error condition */
  POLLHUP      0x010    /* hung up */
  POLLNVAL     0x020    /* invalid polling request */

- event ports (solaris)

  typedef struct port_event {
      int         portev_events;  /* event data is source specific */
      ushort_t    portev_source;  /* event source */
      ushort_t    portev_pad;     /* port internal use */
      uintptr_t   portev_object;  /* source specific object */
      void        *portev_user;   /* user cookie */
  } port_event_t;

  /* port sources */
  PORT_SOURCE_AIO     1
  PORT_SOURCE_TIMER   2
  PORT_SOURCE_USER    3
  PORT_SOURCE_FD      4
  PORT_SOURCE_ALERT   5
  PORT_SOURCE_MQ      6
  PORT_SOURCE_FILE    7


================================================
FILE: notes/socket.txt
================================================
- int listen(int sockfd, int backlog);

  Linux: The  backlog  argument defines the maximum length to which the
  queue of pending connections for sockfd may grow.  If a connection
  request arrives when the queue is full, the client may receive an error
  with an indication of ECONNREFUSED or, if the underlying protocol
  supports retransmission, the request may be ignored so that a later
  reattempt at connection succeeds.

  backlog specifies the queue length for completely established sockets
  waiting to be accepted, instead of the number of incomplete connection
  requests. The maximum length of the queue for incomplete sockets can
  be set using /proc/sys/net/ipv4/tcp_max_syn_backlog.

  If the backlog argument is greater than the value in /proc/sys/net/core/somaxconn,
  then it is silently truncated to that value; the default value in this
  file is 128.  In kernels before 2.4.25, this limit was a hard coded value,
  SOMAXCONN, with the value 128.

  BSD: The backlog argument defines the maximum length the queue of pending
  connections may grow to.  The real maximum queue length will be 1.5 times
  more than the value specified in the backlog argument.  A subsequent
  listen() system call on the listening socket allows the caller to change
  the maximum queue length using a new backlog argument.  If a connection
  request arrives with the queue full the client may receive an error with
  an indication of ECONNREFUSED, or, in the case of TCP, the connection
  will be silently dropped.

  The listen() system call appeared in 4.2BSD.  The ability to configure
  the maximum backlog at run-time, and to use a negative backlog to request
  the maximum allowable value, was introduced in FreeBSD 2.2.

- SO_LINGER (linger) socket option

  This option specifies what should happen when the socket of a type that
  promises reliable delivery still has untransmitted messages when it is
  closed

  struct linger {
      int l_onoff;  /* nonzero to linger on close  */
      int l_linger; /* time to linger (in secs)  */
  };

  l_onoff = 0 (default), then l_linger value is ignored and close returns
  immediately. But if there is any data still remaining in the socket send
  buffer, the system will try to deliver the data to the peer

  l_onoff = nonzero, then close blocks until data is transmitted or the
  l_linger timeout period expires
  a) l_linger = 0, TCP aborts connection, discards any data still remaining
     in the socket send buffer and sends RST to peer. This avoids the
     TCP's TIME_WAIT state
  b) l_linger = nonzero, then kernel will linger when socket is closed. If
     there is any pending data in the socket send buffer, the kernel waits
     until all the data is sent and acknowledged by peer TCP, or the
     linger time expires

  If a socket is set as nonblocking, it will not wait for close to complete
  even if linger time is nonzero

- TIME_WAIT state

  The end that performs active close i.e. the end that sends the first FIN
  goes into TIME_WAIT state. After a FIN packet is sent to the peer and
  after that peer's FIN/ACK arrives and is ACKed, we go into a TIME_WAIT
  state. The duration that the end point remains in this state is 2 x MSL
  (maximum segment lifetime). The reason that the duration of the TIME_WAIT
  state is 2 x MSL is because the maximum amount of time a packet can wander
  around a network is assumed to be MSL seconds. The factor of 2 is for the
  round-trip. The recommended value for MSL is 120 seconds, but Berkeley
  derived implementations normally use 30 seconds instead. This means a
  TIME_WAIT delay is between 1 and 4 minutes.

  For Linux, the TIME_WAIT state duration is 1 minute (net/tcp.h):
  #define TCP_TIMEWAIT_LEN (60*HZ) /* how long to wait to destroy TIME-WAIT
                                    * state, about 60 seconds */

  TIME_WAIT state on client, combined with limited number of ephemeral ports
  available for TCP connections severely limits the rate at which new
  connections to the server can be created. On Linux, by default ephemeral
  ports are in the range of 32768 to 61000:

  $ cat /proc/sys/net/ipv4/ip_local_port_range
  32768 61000

  So with a TIME_WAIT state duration of 1 minute, the maximum sustained rate
  for any client is ~470 new connections per second

- TCP keepalive

  TCP keepalive packet (TCP packet with no data and the ACK flag turned on)
  is used to assert that connection is still up and running. This is useful
  because if the remote peer goes away without closing their connection, the
  keepalive probe will detect this and notice that the connection is broken
  even if there is no traffic on it.

  Imagine, the following scenario: You have a valid TCP connection established
  between two endpoints A and B. B terminates abnormally (think kernel panic
  or unplugging of network cable) without sending anything over the network
  to notify A that connection is broken. A, from its side, is ready to
  receive data, and has no idea that B has gone away. Now B comes back up
  again, and while A knows about a connection with B and still thinks it is
  active, B has no such idea. A tries to send data to B over a dead
  connection, and B replies with an RST packet, causing A to finally close
  the connection. So, without a keepalive probe A would never close the
  connection if it never sent data over it.

- There are four socket functions that pass a socket address structure from
  the process to the kernel - bind, connect, sendmsg and sendto. These
  functions are also responsible for passing the length of the sockaddr that
  they are passing (socklen_t).
  There are five socket functions that pass a socket address structure from
  the kernel to the process - accept, recvfrom, recvmsg, getpeername and
  getsockname. The kernel is also responsible for returning the length of
  the sockaddr struct that it returns to userspace.

  Different sockaddr structs:
  1. sockaddr_in
  2. sockaddr_in6
  3. sockaddr_un

  Special types of in_addr_t
  /* Address to accept any incoming messages */
  #define INADDR_ANY ((in_addr_t) 0x00000000)

  /* Address to send to all hosts */
  #define INADDR_BROADCAST ((in_addr_t) 0xffffffff)

  /* Address indicating an error return */
  #define INADDR_NONE ((in_addr_t) 0xffffffff)


================================================
FILE: scripts/.gitignore
================================================
*.pyc
*.out
*.log


================================================
FILE: src/Makefile.am
================================================
# Makefile.in is listed for removal by "make maintainer-clean".
MAINTAINERCLEANFILES = Makefile.in

# Preprocessor flags: _GNU_SOURCE on every platform except Solaris, followed
# by the include directories of the bundled dependencies under dep/.
AM_CPPFLAGS =
if !OS_SOLARIS
AM_CPPFLAGS += -D_GNU_SOURCE
endif
AM_CPPFLAGS += -I $(top_srcdir)/dep/dhashkit
AM_CPPFLAGS += -I $(top_srcdir)/dep/ae
AM_CPPFLAGS += -I $(top_srcdir)/dep/util
AM_CPPFLAGS += -I $(top_srcdir)/dep/jemalloc-4.2.0/include
AM_CPPFLAGS += -I $(top_srcdir)/dep/dmalloc
AM_CPPFLAGS += -I $(top_srcdir)/dep/sds
AM_CPPFLAGS += -I $(top_srcdir)/dep/darray
AM_CPPFLAGS += -I $(top_srcdir)/dep/dlist

# Compiler flags: strict aliasing optimizations disabled, plus the warning set
# used for every source file in this directory.
# NOTE(review): -Wunused-value is enabled and then -Wno-unused-value is passed
# on the next line; confirm which of the two is intended.
AM_CFLAGS = 
AM_CFLAGS += -fno-strict-aliasing
AM_CFLAGS += -Wall -Wshadow
AM_CFLAGS += -Wpointer-arith
AM_CFLAGS += -Winline
AM_CFLAGS += -Wunused-function -Wunused-variable -Wunused-value
AM_CFLAGS += -Wno-unused-parameter -Wno-unused-value
AM_CFLAGS += -Wconversion -Wsign-compare
AM_CFLAGS += -Wstrict-prototypes -Wmissing-prototypes -Wredundant-decls -Wmissing-declarations

# Linker flags: libm and libpthread everywhere; the remaining libraries are
# added per platform by the conditionals below.
AM_LDFLAGS =
AM_LDFLAGS += -lm -lpthread -rdynamic
if !OS_DARWIN
AM_LDFLAGS += -lrt
endif
if OS_SOLARIS
AM_LDFLAGS += -lnsl -lsocket
endif
if OS_FREEBSD
AM_LDFLAGS += -lexecinfo
endif

sbin_PROGRAMS = vire

vire_SOURCES =                          \
    vr_aof.c vr_aof.h                   \
    vr_block.c vr_block.h               \
    vr_client.c vr_client.h             \
    vr_command.c vr_command.h           \
    vr_conf.c vr_conf.h                 \
    vr_connection.c vr_connection.h     \
    vr_core.c vr_core.h                 \
    vr_db.c vr_db.h                     \
    vr_dict.c vr_dict.h                 \
    vr_eventloop.c vr_eventloop.h       \
    vr_intset.c vr_intset.h             \
    vr_listen.c vr_listen.h             \
    vr_lzf.h vr_lzfP.h                  \
    vr_lzf_c.c vr_lzf_d.c               \
    vr_master.c vr_master.h             \
    vr_multi.c vr_multi.h               \
    vr_notify.c vr_notify.h             \
    vr_object.c vr_object.h             \
    vr_pubsub.c vr_pubsub.h             \
    vr_quicklist.c vr_quicklist.h       \
    vr_rbtree.c vr_rbtree.h             \
    vr_rdb.c vr_rdb.h                   \
    vr_replication.c vr_replication.h   \
    vr_scripting.c vr_scripting.h       \
    vr_server.c vr_server.h             \
    vr_signal.c vr_signal.h             \
    vr_slowlog.c vr_slowlog.h           \
    vr_specialconfig.h                  \
    vr_stats.c vr_stats.h               \
    vr_thread.c vr_thread.h             \
    vr_t_hash.c vr_t_hash.h             \
    vr_t_list.c vr_t_list.h             \
    vr_t_set.c vr_t_set.h               \
    vr_t_string.c vr_t_string.h         \
    vr_t_zset.c vr_t_zset.h             \
    vr_util.c vr_util.h                 \
    vr_worker.c vr_worker.h             \
    vr_backend.c vr_backend.h           \
    vr_ziplist.c vr_ziplist.h           \
    vr_zipmap.c vr_zipmap.h             \
    vr_bitops.c vr_bitops.h             \
    vr_hyperloglog.c vr_hyperloglog.h   \
    vr.c
    
# Static libraries linked into the vire binary; all of them come from the
# bundled dependencies under dep/ in the build tree.
vire_LDADD = $(top_builddir)/dep/util/libdutil.a
vire_LDADD += $(top_builddir)/dep/ae/libae.a
vire_LDADD += $(top_builddir)/dep/sds/libsds.a
vire_LDADD += $(top_builddir)/dep/darray/libdarray.a
vire_LDADD += $(top_builddir)/dep/dlist/libdlist.a
vire_LDADD += $(top_builddir)/dep/dhashkit/libdhashkit.a
vire_LDADD += $(top_builddir)/dep/jemalloc-4.2.0/lib/libjemalloc.a
vire_LDADD += $(top_builddir)/dep/dmalloc/libdmalloc.a

================================================
FILE: src/vr.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>
#include <signal.h>
#include <getopt.h>
#include <fcntl.h>
#include <sys/stat.h>
#include <sys/utsname.h>

#include <vr_core.h>
#include <vr_conf.h>
#include <vr_signal.h>

#define VR_CONF_PATH        "conf/vire.conf"

#define VR_LOG_DEFAULT      LOG_NOTICE
#define VR_LOG_MIN          LOG_EMERG
#define VR_LOG_MAX          LOG_PVERB
#define VR_LOG_PATH         NULL

#define VR_PORT             8889
#define VR_ADDR             "0.0.0.0"
#define VR_INTERVAL         (30 * 1000) /* in msec */

#define VR_PID_FILE         NULL

#define VR_THREAD_NUM_DEFAULT	(sysconf(_SC_NPROCESSORS_ONLN)>6?6:sysconf(_SC_NPROCESSORS_ONLN))

/*
 * Command line flags. They are set by vr_get_options(); show_help,
 * show_version and test_conf are read by main(), daemonize by vr_pre_run().
 */
static int show_help;
static int show_version;
static int test_conf;
static int daemonize;

/*
 * Long option table handed to getopt_long(). The last field of each entry is
 * the short option character that getopt_long() returns for it; the
 * all-zero entry terminates the table.
 */
static struct option long_options[] = {
    { "help",           no_argument,        NULL,   'h' },
    { "version",        no_argument,        NULL,   'V' },
    { "test-conf",      no_argument,        NULL,   't' },
    { "daemonize",      no_argument,        NULL,   'd' },
    { "verbose",        required_argument,  NULL,   'v' },
    { "output",         required_argument,  NULL,   'o' },
    { "conf-file",      required_argument,  NULL,   'c' },
    { "pid-file",       required_argument,  NULL,   'p' },
    { "thread-num",     required_argument,  NULL,   'T' },
    { NULL,             0,                  NULL,    0  }
};

/* Short option string; a trailing ':' marks an option that takes an argument */
static char short_options[] = "hVtdv:o:c:p:T:";

/*
 * Turn the calling process into a daemon.
 *
 * The process forks twice (calling setsid() and ignoring SIGHUP in between),
 * optionally changes its working directory to "/", clears the umask and
 * points stdin, stdout and stderr at /dev/null.
 *
 * dump_core - when 0 the working directory is changed to "/"; any other
 *             value leaves the working directory untouched.
 *
 * Returns VR_OK on success and VR_ERROR as soon as any step fails. The
 * parent of each fork() leaves through _exit(0) and never returns.
 */
static rstatus_t
vr_daemonize(int dump_core)
{
    rstatus_t rc;
    pid_t child, session;
    int null_fd;

    /* first fork: the original process exits, the child carries on */
    child = fork();
    if (child == -1) {
        log_error("fork() failed: %s", strerror(errno));
        return VR_ERROR;
    }
    if (child != 0) {
        _exit(0);
    }

    /* the first child becomes the leader of a new session */
    session = setsid();
    if (session < 0) {
        log_error("setsid() failed: %s", strerror(errno));
        return VR_ERROR;
    }

    if (signal(SIGHUP, SIG_IGN) == SIG_ERR) {
        log_error("signal(SIGHUP, SIG_IGN) failed: %s", strerror(errno));
        return VR_ERROR;
    }

    /* second fork: the first child exits, the second child carries on */
    child = fork();
    if (child == -1) {
        log_error("fork() failed: %s", strerror(errno));
        return VR_ERROR;
    }
    if (child != 0) {
        _exit(0);
    }

    /* move to the root directory unless the caller asked to stay put */
    if (dump_core == 0) {
        rc = chdir("/");
        if (rc < 0) {
            log_error("chdir(\"/\") failed: %s", strerror(errno));
            return VR_ERROR;
        }
    }

    /* start from an empty file mode creation mask */
    umask(0);

    /* point the three standard descriptors at "/dev/null" */
    null_fd = open("/dev/null", O_RDWR);
    if (null_fd < 0) {
        log_error("open(\"/dev/null\") failed: %s", strerror(errno));
        return VR_ERROR;
    }

    rc = dup2(null_fd, STDIN_FILENO);
    if (rc < 0) {
        log_error("dup2(%d, STDIN) failed: %s", null_fd, strerror(errno));
        close(null_fd);
        return VR_ERROR;
    }

    rc = dup2(null_fd, STDOUT_FILENO);
    if (rc < 0) {
        log_error("dup2(%d, STDOUT) failed: %s", null_fd, strerror(errno));
        close(null_fd);
        return VR_ERROR;
    }

    rc = dup2(null_fd, STDERR_FILENO);
    if (rc < 0) {
        log_error("dup2(%d, STDERR) failed: %s", null_fd, strerror(errno));
        close(null_fd);
        return VR_ERROR;
    }

    /* the extra descriptor is only closed when it is not a standard one */
    if (null_fd <= STDERR_FILENO) {
        return VR_OK;
    }

    rc = close(null_fd);
    if (rc < 0) {
        log_error("close(%d) failed: %s", null_fd, strerror(errno));
        return VR_ERROR;
    }

    return VR_OK;
}

/*
 * Write the startup banner through log_write_len().
 *
 * When a log file name is configured the multi-line ASCII logo is written,
 * otherwise a single summary line. Both carry the version, word size, mode,
 * port, pid and the uname() fields; if uname() fails each of its fields is
 * replaced by a single space.
 */
static void
vr_print_run(struct instance *nci)
{
    int status;
    struct utsname name;
    const char *sysname, *release, *machine;

    status = uname(&name);
    sysname = status < 0 ? " " : name.sysname;
    release = status < 0 ? " " : name.release;
    machine = status < 0 ? " " : name.machine;

    if (nci->log_filename) {
        /*
         * The backslash in the fourth row is written as "\\": a lone "\-"
         * is not a valid C escape sequence, and compilers that accept it
         * silently drop the backslash from the banner.
         */
        const char *ascii_logo =
"                _._                                                  \n"
"           _.-``__ ''-._                                             \n"
"      _.-``    `.  *_.  ''-._           Vire %s %s bit\n"
"  .-`` .-```.  ```\\-/    _.,_ ''-._                                   \n"
" (    |      |       .-`    `,    )     Running in %s mode\n"
" |`-._`-...-` __...-.``-._;'` _.-'|     Port: %d\n"
" |    `-._   `._    /     _.-'    |     PID: %ld\n"
"  `-._    `-._  `-./  _.-'    _.-'      OS: %s %s %s\n"
" |`-._`-._    `-.__.-'    _.-'_.-'|                                  \n"
" |    `-._`-._        _.-'_.-'    |     https://github.com/vipshop/vire\n"
"  `-._    `-._`-.__.-'_.-'    _.-'                                   \n"
" |`-._`-._    `-.__.-'    _.-'_.-'|                                  \n"
" |    `-._`-._        _.-'_.-'    |                                  \n"
"  `-._    `-._`-.__.-'_.-'    _.-'                                   \n"
"      `-._    `-.__.-'    _.-'                                       \n"
"          `-._        _.-'                                           \n"
"              `-.__.-'                                               \n\n";
        char *buf;

        buf = dalloc(1024*16);
        if (buf == NULL) {
            /* the banner is cosmetic; do not dereference a failed allocation */
            log_warn("allocating the startup banner failed, ignored");
            return;
        }

        snprintf(buf,1024*16,ascii_logo,
            VR_VERSION_STRING,
            (sizeof(long) == 8) ? "64" : "32",
            "standalone", server.port,
            (long) nci->pid,
            sysname, release, machine);
        log_write_len(buf, strlen(buf));
        dfree(buf);
    } else {
        char buf[256];

        snprintf(buf,sizeof(buf),"Vire %s, %s bit, %s mode, port %d, pid %ld, built for %s %s %s ready to run.\n",
            VR_VERSION_STRING, (sizeof(long) == 8) ? "64" : "32",
            "standalone", server.port, (long) nci->pid,
            sysname, release, machine);
        log_write_len(buf, strlen(buf));
    }
}

/* Log the final shutdown message; called from vr_post_run(). */
static void
vr_print_done(void)
{
    loga("done, rabbit done");
}

/*
 * Print the command line synopsis and the option list to stderr, including
 * the compiled-in defaults for the log level, log file, configuration file,
 * pid file and worker thread count.
 */
static void
vr_show_usage(void)
{
    log_stderr(
        "Usage: vire [-?hVdt] [-v verbosity level] [-o output file]" CRLF
        "            [-c conf file] [-p pid file]" CRLF
        "            [-T worker threads number]" CRLF
        "");
    log_stderr(
        "Options:" CRLF
        "  -h, --help             : this help" CRLF
        "  -V, --version          : show version and exit" CRLF
        "  -t, --test-conf        : test configuration for syntax errors and exit" CRLF
        "  -d, --daemonize        : run as a daemon");
    /* the long name must match the "thread-num" entry in long_options */
    log_stderr(
        "  -v, --verbose=N        : set logging level (default: %d, min: %d, max: %d)" CRLF
        "  -o, --output=S         : set logging file (default: %s)" CRLF
        "  -c, --conf-file=S      : set configuration file (default: %s)" CRLF
        "  -p, --pid-file=S       : set pid file (default: %s)" CRLF
        "  -T, --thread-num=N     : set the worker threads number (default: %d)" CRLF
        "",
        VR_LOG_DEFAULT, VR_LOG_MIN, VR_LOG_MAX,
        VR_LOG_PATH != NULL ? VR_LOG_PATH : "stderr",
        VR_CONF_PATH,
        VR_PID_FILE != NULL ? VR_PID_FILE : "off",
        /* sysconf() yields a long; %d needs an int */
        (int)VR_THREAD_NUM_DEFAULT);
}

/*
 * Create (or truncate) the pid file named by nci->pid_filename and write
 * nci->pid into it as decimal text.
 *
 * nci->pidfile is set to 1 as soon as the file has been opened, so that
 * vr_post_run() removes the file even when the write below fails.
 *
 * Returns VR_OK on success, VR_ERROR if the file cannot be opened or
 * written. The descriptor is closed on every path after a successful open.
 */
static rstatus_t
vr_create_pidfile(struct instance *nci)
{
    char pid[VR_UINTMAX_MAXLEN];
    int fd, pid_len;
    ssize_t n;
    rstatus_t status;

    fd = open(nci->pid_filename, O_WRONLY | O_CREAT | O_TRUNC, 0644);
    if (fd < 0) {
        log_error("opening pid file '%s' failed: %s", nci->pid_filename,
                  strerror(errno));
        return VR_ERROR;
    }
    nci->pidfile = 1;

    /* pid_t is not guaranteed to be int; cast to match the %d conversion */
    pid_len = dsnprintf(pid, VR_UINTMAX_MAXLEN, "%d", (int)nci->pid);

    status = VR_OK;
    n = vr_write(fd, pid, pid_len);
    if (n < 0) {
        /* report before close() so that errno still belongs to the write */
        log_error("write to pid file '%s' failed: %s", nci->pid_filename,
                  strerror(errno));
        status = VR_ERROR;
    }

    close(fd);

    return status;
}

/*
 * Delete the pid file named by nci->pid_filename. A failure is logged and
 * otherwise ignored.
 */
static void
vr_remove_pidfile(struct instance *nci)
{
    if (unlink(nci->pid_filename) < 0) {
        log_error("unlink of pid file '%s' failed, ignored: %s",
                  nci->pid_filename, strerror(errno));
    }
}

/*
 * Fill *nci with the built-in defaults that apply before the command line
 * is parsed: log level and log path, configuration file path, host name,
 * an unset pid and pid file, and the default worker thread count.
 */
static void
vr_set_default_options(struct instance *nci)
{
    /* logging and configuration */
    nci->log_level = VR_LOG_DEFAULT;
    nci->log_filename = VR_LOG_PATH;
    nci->conf_filename = VR_CONF_PATH;

    /* process identity; the pid itself is filled in later by vr_pre_run() */
    nci->pid = (pid_t)-1;
    nci->pid_filename = NULL;
    nci->pidfile = 0;

    nci->thread_num = (int)VR_THREAD_NUM_DEFAULT;

    /* host name, falling back to "unknown" when it cannot be obtained */
    if (vr_gethostname(nci->hostname, VR_MAXHOSTNAMELEN) < 0) {
        log_warn("gethostname failed, ignored: %s", strerror(errno));
        dsnprintf(nci->hostname, VR_MAXHOSTNAMELEN, "unknown");
    }
    /* terminate explicitly in either case */
    nci->hostname[VR_MAXHOSTNAMELEN - 1] = '\0';
}

/*
 * Report the option that getopt_long() rejected with '?'. 'opt' is the
 * offending option character (the value of optopt).
 */
static void
vr_report_rejected_option(int opt)
{
    if (opt == 'o' || opt == 'c' || opt == 'p') {
        log_stderr("vire: option -%c requires a file name",
                   opt);
    } else if (opt == 'v' || opt == 'T') {
        log_stderr("vire: option -%c requires a number", opt);
    } else {
        log_stderr("vire: invalid option -- '%c'", opt);
    }
}

/*
 * Parse the command line into *nci and the file-level flags (show_help,
 * show_version, test_conf, daemonize).
 *
 * getopt's own diagnostics are disabled (opterr = 0); this function prints
 * its own messages instead.
 *
 * Returns VR_OK when every option was accepted, VR_ERROR on the first
 * invalid option or option argument.
 */
static rstatus_t
vr_get_options(int argc, char **argv, struct instance *nci)
{
    int opt, number;

    opterr = 0;

    while ((opt = getopt_long(argc, argv, short_options,
                              long_options, NULL)) != -1) {
        switch (opt) {
        case 'h':
            /* help is shown together with the version */
            show_version = 1;
            show_help = 1;
            break;

        case 'V':
            show_version = 1;
            break;

        case 't':
            test_conf = 1;
            break;

        case 'd':
            daemonize = 1;
            break;

        case 'v':
            number = vr_atoi(optarg, strlen(optarg));
            if (number < 0) {
                log_stderr("vire: option -v requires a number");
                return VR_ERROR;
            }
            nci->log_level = number;
            break;

        case 'o':
            nci->log_filename = optarg;
            break;

        case 'c':
            nci->conf_filename = optarg;
            break;

        case 'p':
            nci->pid_filename = optarg;
            break;

        case 'T':
            number = vr_atoi(optarg, strlen(optarg));
            if (number < 0) {
                log_stderr("vire: option -T requires a number");
                return VR_ERROR;
            }
            nci->thread_num = number;
            break;

        case '?':
            vr_report_rejected_option(optopt);
            return VR_ERROR;

        default:
            log_stderr("vire: invalid option -- '%c'", optopt);
            return VR_ERROR;
        }
    }

    return VR_OK;
}

/*
 * Check the configuration file named by nci->conf_filename by building a
 * configuration object from it with conf_create() and destroying it again.
 *
 * When 'test' is nonzero the verdict is also printed to stderr.
 *
 * Returns true if the configuration could be created, false otherwise.
 */
static bool
vr_test_conf(struct instance *nci, int test)
{
    vr_conf *cf;
    bool valid;

    cf = conf_create(nci->conf_filename);
    valid = (cf != NULL);

    if (valid) {
        conf_destroy(cf);
    }

    if (test) {
        if (valid) {
            log_stderr("vire: configuration file '%s' syntax is ok",
                nci->conf_filename);
        } else {
            log_stderr("vire: configuration file '%s' syntax is invalid",
                nci->conf_filename);
        }
    }

    return valid;
}

/*
 * Bring the process up to the point where the threads can be started:
 * initialize logging, validate the configuration file, daemonize if
 * requested, record the pid, install signal handling, write the pid file
 * if one was requested, initialize the server and print the banner.
 *
 * Returns VR_OK on success. On failure it returns the status of the failing
 * step or VR_ERROR; steps that already succeeded are not undone here.
 */
static int
vr_pre_run(struct instance *nci)
{
    int ret;

    ret = log_init(nci->log_level, nci->log_filename);
    if (ret != VR_OK) {
        return ret;
    }

    /* the value printed is the configuration file, so label it as such */
    log_debug(LOG_VERB, "Vire used conf file: %s", nci->conf_filename);

    if (!vr_test_conf(nci, false)) {
        log_error("conf file %s is error", nci->conf_filename);
        return VR_ERROR;
    }

    if (daemonize) {
        /* a nonzero argument makes vr_daemonize() keep the working directory */
        ret = vr_daemonize(1);
        if (ret != VR_OK) {
            return ret;
        }
    }

    /* taken after daemonizing so it is the pid of the surviving process */
    nci->pid = getpid();

    ret = signal_init();
    if (ret != VR_OK) {
        return ret;
    }

    if (nci->pid_filename) {
        ret = vr_create_pidfile(nci);
        if (ret != VR_OK) {
            return VR_ERROR;
        }
    }

    ret = init_server(nci);
    if (ret != VR_OK) {
        return VR_ERROR;
    }

    vr_print_run(nci);

    return VR_OK;
}

/*
 * Tear down what vr_pre_run() and vr_run() set up: deinitialize the worker,
 * backend and master threads, remove the pid file if one was created,
 * deinitialize signal handling, log the final message and close the log.
 */
static void
vr_post_run(struct instance *nci)
{
    /* deinit the threads */
    workers_deinit();
    backends_deinit();
    master_deinit();
    
    /* nci->pidfile is only set once vr_create_pidfile() opened the file */
    if (nci->pidfile) {
        vr_remove_pidfile(nci);
    }

    signal_deinit();

    /* must come before log_deinit() since it writes through the log */
    vr_print_done();

    log_deinit();
}

/*
 * Start the master, worker and backend threads and block until the worker
 * and backend threads have finished.
 *
 * Nothing is started when nci->thread_num is not positive; a value above 64
 * only produces a warning.
 */
static void
vr_run(struct instance *nci)
{
    int nthreads = nci->thread_num;

    if (nthreads <= 0) {
        log_error("number of work threads must be greater than 0");
        return;
    }

    if (nthreads > 64) {
        log_warn("WARNING: Setting a high number of worker threads is not recommended."
            " Set this value to the number of cores in your machine or less.");
    }

    /* start every thread group */
    master_run();
    workers_run();
    backends_run();

    /* block until the workers and backends are done */
    workers_wait();
    backends_wait();
}

/*
 * Program entry point: apply the default options, parse the command line,
 * handle the "print and exit" modes (version/help, configuration test),
 * then initialize, run and tear down the server.
 */
int
main(int argc, char **argv)
{
    struct instance nci;

    vr_set_default_options(&nci);

    if (vr_get_options(argc, argv, &nci) != VR_OK) {
        vr_show_usage();
        exit(1);
    }

    /* -h implies -V, so the help text is printed after the version */
    if (show_version) {
        log_stderr("This is vire-%s" CRLF, VR_VERSION_STRING);
        if (show_help) {
            vr_show_usage();
        }
        exit(0);
    }

    /* -t: the exit status tells whether the configuration is valid */
    if (test_conf) {
        exit(vr_test_conf(&nci, true) ? 0 : 1);
    }

    if (vr_pre_run(&nci) != VR_OK) {
        vr_post_run(&nci);
        exit(1);
    }

    server.executable = getAbsolutePath(argv[0]);

    vr_run(&nci);

    vr_post_run(&nci);

    return VR_OK;
}


================================================
FILE: src/vr_aof.c
================================================
#include <vr_core.h>

/* Return the current size of the AOF rewrite buffer. */
unsigned long aofRewriteBufferSize(void) {
    unsigned long total = 0;
    dlistIter iter;
    dlistNode *node;

    /* Sum the 'used' byte count of every block in the rewrite buffer list. */
    dlistRewind(server.aof_rewrite_buf_blocks,&iter);
    for (node = dlistNext(&iter); node; node = dlistNext(&iter)) {
        aofrwblock *blk = dlistNodeValue(node);
        total += blk->used;
    }
    return total;
}

/* Create the sds representation of an PEXPIREAT command, using
 * 'seconds' as time to live and 'cmd' to understand what command
 * we are translating into a PEXPIREAT.
 *
 * This command is used in order to translate EXPIRE and PEXPIRE commands
 * into PEXPIREAT command so that we retain precision in the append only
 * file, and the time is always absolute and not relative. */
sds catAppendOnlyExpireAtCommand(sds buf, struct redisCommand *cmd, robj *key, robj *seconds) {
    robj *args[3];
    long long deadline;
    /* Commands whose time argument is expressed in seconds. */
    int in_seconds = (cmd->proc == expireCommand ||
                      cmd->proc == setexCommand ||
                      cmd->proc == expireatCommand);
    /* Commands whose time argument is relative to the current time. */
    int is_relative = (cmd->proc == expireCommand ||
                       cmd->proc == pexpireCommand ||
                       cmd->proc == setexCommand ||
                       cmd->proc == psetexCommand);

    /* Work on a decoded copy so that its ptr can be handed to strtoll. */
    seconds = getDecodedObject(seconds);
    deadline = strtoll(seconds->ptr,NULL,10);
    if (in_seconds) deadline *= 1000;
    if (is_relative) deadline += vr_msec_now();
    decrRefCount(seconds);

    /* Emit "PEXPIREAT <key> <deadline>"; only the two objects created here
     * are released, the key is owned by the caller. */
    args[0] = createStringObject("PEXPIREAT",9);
    args[1] = key;
    args[2] = createStringObjectFromLongLong(deadline);
    buf = catAppendOnlyGenericCommand(buf, 3, args);
    decrRefCount(args[0]);
    decrRefCount(args[2]);
    return buf;
}

/* Append "<prefix><count>\r\n" to 'dst' and return the resulting sds. */
static sds aofCatCountLine(sds dst, char prefix, long long count) {
    char line[32];
    int n;

    line[0] = prefix;
    n = 1+ll2string(line+1,sizeof(line)-1,count);
    line[n++] = '\r';
    line[n++] = '\n';
    return sdscatlen(dst,line,n);
}

/* Append to 'dst' the command made of the 'argc' objects in 'argv': a
 * "*<argc>" line followed, for every argument, by a "$<length>" line and
 * the argument bytes, each terminated by "\r\n". Returns the (possibly
 * reallocated) sds. */
sds catAppendOnlyGenericCommand(sds dst, int argc, robj **argv) {
    int idx;

    dst = aofCatCountLine(dst,'*',argc);

    for (idx = 0; idx < argc; idx++) {
        /* Arguments are decoded first so that ptr is an sds string. */
        robj *arg = getDecodedObject(argv[idx]);

        dst = aofCatCountLine(dst,'$',sdslen(arg->ptr));
        dst = sdscatlen(dst,arg->ptr,sdslen(arg->ptr));
        dst = sdscatlen(dst,"\r\n",2);
        decrRefCount(arg);
    }
    return dst;
}

/* Event handler used to send data to the child process doing the AOF
 * rewrite. We send pieces of our AOF differences buffer so that the final
 * write when the child finishes the rewrite will be small. */
void aofChildWriteDiffData(aeEventLoop *el, int fd, void *privdata, int mask) {
    dlistNode *head;
    aofrwblock *blk;
    ssize_t sent;
    UNUSED(el);
    UNUSED(fd);
    UNUSED(privdata);
    UNUSED(mask);

    for (;;) {
        head = dlistFirst(server.aof_rewrite_buf_blocks);
        blk = head ? head->value : NULL;

        /* Nothing left to send, or sending was stopped: unregister the
         * writable event and leave. */
        if (server.aof_stop_sending_diff || !blk) {
            aeDeleteFileEvent(server.el,server.aof_pipe_write_data_to_child,
                              AE_WRITABLE);
            return;
        }

        if (blk->used > 0) {
            sent = vr_write(server.aof_pipe_write_data_to_child,
                            blk->buf,blk->used);
            /* Could not write anything now: keep the event installed. */
            if (sent <= 0) return;
            /* Shift the unsent tail to the start of the block. */
            memmove(blk->buf,blk->buf+sent,blk->used-sent);
            blk->used -= sent;
        }

        /* Fully drained blocks are dropped from the list. */
        if (blk->used == 0) dlistDelNode(server.aof_rewrite_buf_blocks,head);
    }
}

/* Append data to the AOF rewrite buffer, allocating new blocks if needed. */
void aofRewriteBufferAppend(unsigned char *s, unsigned long len) {
    dlistNode *tail = dlistLast(server.aof_rewrite_buf_blocks);
    aofrwblock *cur = tail ? tail->value : NULL;

    while (len) {
        int nblocks;

        /* Fill whatever room is left in the current block, if any. */
        if (cur) {
            unsigned long chunk = len;

            if (cur->free < chunk) chunk = cur->free;
            if (chunk) {
                memcpy(cur->buf+cur->used, s, chunk);
                cur->used += chunk;
                cur->free -= chunk;
                s += chunk;
                len -= chunk;
            }
        }

        /* Everything fitted: no new block is needed. */
        if (!len) break;

        /* First block ever, or the current one is full: add a new one. */
        cur = dalloc(sizeof(*cur));
        cur->free = AOF_RW_BUF_BLOCK_SIZE;
        cur->used = 0;
        dlistAddNodeTail(server.aof_rewrite_buf_blocks,cur);

        /* Report the buffer size each time (number of blocks + 1) is a
         * multiple of 10, using the warning level on multiples of 100. */
        nblocks = dlistLength(server.aof_rewrite_buf_blocks);
        if (((nblocks+1) % 10) == 0) {
            int level = ((nblocks+1) % 100) == 0 ? LOG_WARN :
                                                   LOG_NOTICE;
            log_debug(level, "Background AOF buffer size: %lu MB",
                aofRewriteBufferSize()/(1024*1024));
        }
    }

    /* Make sure a writable event is installed on the pipe to the child
     * so that the buffered data eventually gets sent. */
    if (aeGetFileEvents(server.el,server.aof_pipe_write_data_to_child) == 0) {
        aeCreateFileEvent(server.el, server.aof_pipe_write_data_to_child,
            AE_WRITABLE, aofChildWriteDiffData, NULL);
    }
}

/* Serialize the command 'cmd' (arguments in 'argv'/'argc', targeting the
 * database 'dictid') and feed it to the AOF machinery: the result is
 * appended to server.aof_buf when the AOF is on, and to the AOF rewrite
 * buffer when a rewrite child exists (server.aof_child_pid != -1). */
void feedAppendOnlyFile(struct redisCommand *cmd, int dictid, robj **argv, int argc) {
    robj *setargv[3];
    sds out = sdsempty();
    int is_expire = (cmd->proc == expireCommand ||
                     cmd->proc == pexpireCommand ||
                     cmd->proc == expireatCommand);
    int is_setex = (cmd->proc == setexCommand ||
                    cmd->proc == psetexCommand);

    /* Emit a SELECT first when the target DB differs from the one of the
     * previously appended command. */
    if (server.aof_selected_db != dictid) {
        char dbnum[64];

        snprintf(dbnum,sizeof(dbnum),"%d",dictid);
        out = sdscatprintf(out,"*2\r\n$6\r\nSELECT\r\n$%lu\r\n%s\r\n",
            (unsigned long)strlen(dbnum),dbnum);
        server.aof_selected_db = dictid;
    }

    if (is_expire) {
        /* EXPIRE/PEXPIRE/EXPIREAT are rewritten as PEXPIREAT. */
        out = catAppendOnlyExpireAtCommand(out,cmd,argv[1],argv[2]);
    } else if (is_setex) {
        /* SETEX/PSETEX become a SET followed by a PEXPIREAT. */
        setargv[0] = createStringObject("SET",3);
        setargv[1] = argv[1];
        setargv[2] = argv[3];
        out = catAppendOnlyGenericCommand(out,3,setargv);
        decrRefCount(setargv[0]);
        out = catAppendOnlyExpireAtCommand(out,cmd,argv[1],argv[2]);
    } else {
        /* Every other command is written as received. */
        out = catAppendOnlyGenericCommand(out,argc,argv);
    }

    /* AOF enabled: queue the bytes in the AOF buffer. */
    if (server.aof_state == AOF_ON)
        server.aof_buf = sdscatlen(server.aof_buf,out,sdslen(out));

    /* A rewrite child exists: also accumulate the bytes in the rewrite
     * buffer so the differences can be appended to the new file. */
    if (server.aof_child_pid != -1)
        aofRewriteBufferAppend((unsigned char*)out,sdslen(out));

    sdsfree(out);
}


================================================
FILE: src/vr_aof.h
================================================
#ifndef _VR_AOF_H_
#define _VR_AOF_H_

/* AOF states */
#define AOF_OFF 0             /* AOF is off */
#define AOF_ON 1              /* AOF is on */
#define AOF_WAIT_REWRITE 2    /* AOF waits rewrite to start appending */

#define AOF_AUTOSYNC_BYTES (1024*1024*32) /* fdatasync every 32MB */

/* ----------------------------------------------------------------------------
 * AOF rewrite buffer implementation.
 *
 * The following code implement a simple buffer used in order to accumulate
 * changes while the background process is rewriting the AOF file.
 *
 * We only need to append, but can't just use realloc with a large block
 * because 'huge' reallocs are not always handled as one could expect
 * (via remapping of pages at OS level) but may involve copying data.
 *
 * For this reason we use a list of blocks, every block is
 * AOF_RW_BUF_BLOCK_SIZE bytes.
 * ------------------------------------------------------------------------- */

#define AOF_RW_BUF_BLOCK_SIZE (1024*1024*10)    /* 10 MB per block */

/* One fixed-size block of the AOF rewrite buffer list. */
typedef struct aofrwblock {
    /* 'used' is the number of bytes of 'buf' currently holding data and
     * 'free' the number of bytes still available after them; a fresh block
     * starts with used == 0 and free == AOF_RW_BUF_BLOCK_SIZE. */
    unsigned long used, free;
    char buf[AOF_RW_BUF_BLOCK_SIZE];    /* Block payload. */
} aofrwblock;

unsigned long aofRewriteBufferSize(void);
void aofChildWriteDiffData(aeEventLoop *el, int fd, void *privdata, int mask);
sds catAppendOnlyExpireAtCommand(sds buf, struct redisCommand *cmd, robj *key, robj *seconds);
sds catAppendOnlyGenericCommand(sds dst, int argc, robj **argv);
void aofRewriteBufferAppend(unsigned char *s, unsigned long len);
void feedAppendOnlyFile(struct redisCommand *cmd, int dictid, robj **argv, int argc);

#endif


================================================
FILE: src/vr_backend.c
================================================
#include <vr_core.h>

/* Number of backend threads, set by backends_init() to the array length. */
static int num_backend_threads;

struct darray backends;

static void *backend_thread_run(void *args);

/* Initialize a backend: reset its id and the incremental cron state, set up
 * its event loop and register backend_thread_run() as the function run by
 * its thread, with the backend itself as thread data.
 *
 * Returns VR_ERROR when 'backend' is NULL, VR_OK otherwise. */
int
vr_backend_init(vr_backend *backend)
{
    if (backend == NULL) {
        return VR_ERROR;
    }

    backend->id = 0;
    backend->current_db = 0;
    backend->timelimit_exit = 0;
    backend->last_fast_cycle = 0;
    backend->resize_db = 0;
    backend->rehash_db = 0;

    /* NOTE(review): the meaning of the second argument (10) and the result
     * of vr_eventloop_init() are not visible here; confirm whether the
     * result should be checked. */
    vr_eventloop_init(&backend->vel, 10);
    backend->vel.thread.fun_run = backend_thread_run;
    backend->vel.thread.data = backend;

    return VR_OK;
}

/* Release the event loop owned by 'backend'. A NULL backend is ignored. */
void
vr_backend_deinit(vr_backend *backend)
{
    if (backend != NULL) {
        vr_eventloop_deinit(&backend->vel);
    }
}

static int
backend_cron(struct aeEventLoop *eventLoop, long long id, void *clientData) {
    vr_worker *backend = clientData;
    vr_eventloop *vel = &backend->vel;
    size_t stat_used_memory, stats_peak_memory;

    UNUSED(eventLoop);
    UNUSED(id);
    UNUSED(clientData);

    ASSERT(eventLoop == vel->el);

    vel->unixtime = time(NULL);
    vel->mstime = vr_msec_now();

    /* Record the max memory used since the server was started. */
    stat_used_memory = dalloc_used_memory();
    update_stats_get(vel->stats, peak_memory, &stats_peak_memory);
    if (stat_used_memory > stats_peak_memory) {
        update_stats_set(vel->stats, peak_memory, stat_used_memory);
    }

    databasesCron(backend);

    /* Update the config cache */
    run_with_period(1000, vel->cronloops) {
        conf_cache_update(&vel->cc);
    }
    
    vel->cronloops ++;
    return 1000/vel->hz;
}

/* Register backend_cron() as a time event on the backend's event loop, with
 * the backend itself as callback data. Returns VR_OK on success; on failure
 * serverPanic() is invoked and VR_ERROR is returned. */
static int
setup_backend(vr_backend *backend)
{
    if (aeCreateTimeEvent(backend->vel.el, 1, backend_cron, backend, NULL) != AE_ERR) {
        return VR_OK;
    }

    serverPanic("Can't create the serverCron time event.");
    return VR_ERROR;
}

static void *
backend_thread_run(void *args)
{
    vr_worker *backend = args;
    
    /* vire worker run */
    aeMain(backend->vel.el);

    return NULL;
}

int
backends_init(uint32_t backend_count)
{
    rstatus_t status;
    uint32_t idx;
    vr_backend *backend;

    darray_init(&backends, backend_count, sizeof(vr_backend));

    for (idx = 0; idx < backend_count; idx ++) {
        backend = darray_push(&backends);
        vr_backend_init(backend);
        backend->id = idx;
        status = setup_backend(backend);
        if (status != VR_OK) {
            exit(1);
        }
    }
    
    num_backend_threads = (int)darray_n(&backends);

    return VR_OK;
}

/* Start the thread of every backend, in array order. Always returns VR_OK. */
int
backends_run(void)
{
    uint32_t total = (uint32_t)num_backend_threads;
    uint32_t idx = 0;

    while (idx < total) {
        vr_backend *backend = darray_get(&backends, idx);

        vr_thread_start(&backend->vel.thread);
        idx ++;
    }

    return VR_OK;
}

/* Join the thread of every backend, in array order. Always returns VR_OK. */
int
backends_wait(void)
{
    uint32_t total = (uint32_t)num_backend_threads;
    uint32_t idx = 0;

    while (idx < total) {
        vr_backend *backend = darray_get(&backends, idx);

        pthread_join(backend->vel.thread.thread_id, NULL);
        idx ++;
    }

    return VR_OK;
}

/* Pop every backend off the global array and deinitialize it. */
void
backends_deinit(void)
{
    vr_backend *backend;

    while (darray_n(&backends) != 0) {
        backend = darray_pop(&backends);
        vr_backend_deinit(backend);
    }
}


================================================
FILE: src/vr_backend.h
================================================
#ifndef _VR_BACKEND_H_
#define _VR_BACKEND_H_

/* State of one backend thread. */
typedef struct vr_backend {

    int id;                     /* Index assigned by backends_init(). */
    vr_eventloop vel;           /* Event loop (and thread) of this backend. */

    /* State kept across calls of activeExpireCycle() so that the work of
     * expiring keys can continue incrementally. */
    unsigned int current_db;    /* Last DB tested. */
    int timelimit_exit;         /* Time limit hit in previous call? */
    long long last_fast_cycle;  /* When last fast cycle ran. */

    /* Counters kept across cron iterations so that, when databasesCron()
     * stops at a given DB, resizing and rehashing can resume from the
     * following one in the next iteration. */
    unsigned int resize_db;
    unsigned int rehash_db;
}vr_backend;

extern struct darray backends;

int backends_init(uint32_t backend_count);
int backends_run(void);
int backends_wait(void);
void backends_deinit(void);

#endif


================================================
FILE: src/vr_bitops.c
================================================
#include <vr_core.h>

/* -----------------------------------------------------------------------------
 * Helpers and low level bit functions.
 * -------------------------------------------------------------------------- */

/* Count number of bits set in the binary array pointed by 's' and long
 * 'count' bytes. The implementation of this function is required to
 * work with a input string length up to 512 MB. */
size_t redisPopcount(void *s, long count) {
    /* Number of set bits for every possible byte value; row r holds the
     * values for bytes 16*r .. 16*r+15. */
    static const unsigned char bitsinbyte[256] = {
        0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4,
        1,2,2,3,2,3,3,4,2,3,3,4,3,4,4,5,
        1,2,2,3,2,3,3,4,2,3,3,4,3,4,4,5,
        2,3,3,4,3,4,4,5,3,4,4,5,4,5,5,6,
        1,2,2,3,2,3,3,4,2,3,3,4,3,4,4,5,
        2,3,3,4,3,4,4,5,3,4,4,5,4,5,5,6,
        2,3,3,4,3,4,4,5,3,4,4,5,4,5,5,6,
        3,4,4,5,4,5,5,6,4,5,5,6,5,6,6,7,
        1,2,2,3,2,3,3,4,2,3,3,4,3,4,4,5,
        2,3,3,4,3,4,4,5,3,4,4,5,4,5,5,6,
        2,3,3,4,3,4,4,5,3,4,4,5,4,5,5,6,
        3,4,4,5,4,5,5,6,4,5,5,6,5,6,6,7,
        2,3,3,4,3,4,4,5,3,4,4,5,4,5,5,6,
        3,4,4,5,4,5,5,6,4,5,5,6,5,6,6,7,
        3,4,4,5,4,5,5,6,4,5,5,6,5,6,6,7,
        4,5,5,6,5,6,6,7,5,6,6,7,6,7,7,8
    };
    unsigned char *cursor = s;
    uint32_t *words;
    size_t total = 0;
    int k;

    /* Leading bytes, one at a time, until the address is 4-byte aligned. */
    while(((unsigned long)cursor & 3) && count) {
        total += bitsinbyte[*cursor++];
        count--;
    }

    /* Bulk part: groups of seven 32-bit words (28 bytes). Each word is
     * reduced to four per-byte counts, the seven words are added lane by
     * lane, and a single multiply folds the four lanes into the top byte. */
    words = (uint32_t*)cursor;
    while(count >= 28) {
        uint32_t lanes = 0;

        for (k = 0; k < 7; k++) {
            uint32_t w = *words++;

            w = w - ((w >> 1) & 0x55555555);
            w = (w & 0x33333333) + ((w >> 2) & 0x33333333);
            lanes += (w + (w >> 4)) & 0x0F0F0F0F;
        }
        total += (lanes * 0x01010101) >> 24;
        count -= 28;
    }

    /* Trailing bytes that did not fill a whole 28-byte group. */
    cursor = (unsigned char*)words;
    while(count--) total += bitsinbyte[*cursor++];
    return total;
}

/* Return the position of the first bit set to one (if 'bit' is 1) or
 * zero (if 'bit' is 0) in the bitmap starting at 's' and long 'count' bytes.
 *
 * The function is guaranteed to return a value >= 0 if 'bit' is 0 since if
 * no zero bit is found, it returns count*8 assuming the string is zero
 * padded on the right. However if 'bit' is 1 it is possible that there is
 * not a single set bit in the bitmap. In this special case -1 is returned. */
long redisBitpos(void *s, unsigned long count, int bit) {
    unsigned long *l;
    unsigned char *c;
    unsigned long skipval, word = 0, one;
    long pos = 0; /* Position of bit, to return to the caller. */
    unsigned long j;

    /* Process whole words first, seeking for first word that is not
     * all ones or all zeros respectively if we are looking for zeros
     * or ones. This is much faster with large strings having contiguous
     * blocks of 1 or 0 bits compared to the vanilla bit per bit processing.
     *
     * Note that if we start from an address that is not aligned
     * to sizeof(unsigned long) we consume it byte by byte until it is
     * aligned. */

    /* Skip initial bits not aligned to sizeof(unsigned long) byte by byte. */
    skipval = bit ? 0 : UCHAR_MAX;
    c = (unsigned char*) s;
    while((unsigned long)c & (sizeof(*l)-1) && count) {
        /* Stop at the first byte that may contain the bit we look for. */
        if (*c != skipval) break;
        c++;
        count--;
        pos += 8;
    }

    /* Skip bits with full word step. */
    skipval = bit ? 0 : ULONG_MAX;
    l = (unsigned long*) c;
    while (count >= sizeof(*l)) {
        if (*l != skipval) break;
        l++;
        count -= sizeof(*l);
        pos += sizeof(*l)*8;
    }

    /* Load bytes into "word" considering the first byte as the most significant
     * (we basically consider it as written in big endian, since we consider the
     * string as a set of bits from left to right, with the first bit at position
     * zero.
     *
     * Note that the loading is designed to work even when the bytes left
     * (count) are less than a full word. We pad it with zero on the right. */
    c = (unsigned char*)l;
    for (j = 0; j < sizeof(*l); j++) {
        word <<= 8;
        if (count) {
            word |= *c;
            c++;
            count--;
        }
    }

    /* Special case:
     * If bits in the string are all zero and we are looking for one,
     * return -1 to signal that there is not a single "1" in the whole
     * string. This can't happen when we are looking for "0" as we assume
     * that the right of the string is zero padded. */
    if (bit == 1 && word == 0) return -1;

    /* Last word left, scan bit by bit. The first thing we need is to
     * have a single "1" set in the most significant position in an
     * unsigned long. We don't know the size of the long so we use a
     * simple trick. */
    one = ULONG_MAX; /* All bits set to 1.*/
    one >>= 1;       /* All bits set to 1 but the MSB. */
    one = ~one;      /* All bits set to 0 but the MSB. */

    /* Walk the mask from the most significant bit down; 'pos' advances by
     * one for every bit that does not match. */
    while(one) {
        if (((one & word) != 0) == bit) return pos;
        pos++;
        one >>= 1;
    }

    /* If we reached this point, there is a bug in the algorithm, since
     * the case of no match is handled as a special case before. */
    serverPanic("End of redisBitpos() reached.");
    return 0; /* Just to avoid warnings. */
}

/* The following set.*Bitfield and get.*Bitfield functions implement setting
 * and getting arbitrary size (up to 64 bits) signed and unsigned integers
 * at arbitrary positions into a bitmap.
 *
 * The representation considers the bitmap as having the bit number 0 to be
 * the most significant bit of the first byte, and so forth, so for example
 * setting a 5 bits unsigned integer to value 23 at offset 7 into a bitmap
 * previously set to all zeroes, will produce the following representation:
 *
 * +--------+--------+
 * |00000001|01110000|
 * +--------+--------+
 *
 * When offsets and integer sizes are aligned to bytes boundaries, this is the
 * same as big endian, however when such alignment does not exist, its important
 * to also understand how the bits inside a byte are ordered.
 *
 * Note that this format follows the same convention as SETBIT and related
 * commands.
 */

/* Store the low 'bits' bits of 'value' into the bitmap 'p', starting at bit
 * position 'offset'. Bit 0 of the bitmap is the most significant bit of the
 * first byte, and the most significant bit of the field is written first. */
void setUnsignedBitfield(unsigned char *p, uint64_t offset, uint64_t bits, uint64_t value) {
    uint64_t remaining;

    for (remaining = bits; remaining > 0; remaining--, offset++) {
        uint64_t idx = offset >> 3;              /* Byte holding the bit. */
        uint64_t shift = 7 - (offset & 0x7);     /* Bit position inside it. */
        uint64_t on = (value >> (remaining-1)) & 1;

        /* Clear the target bit, then set it to the wanted value. */
        p[idx] = (unsigned char)((p[idx] & ~(1u << shift)) | (on << shift));
    }
}

/* Same as setUnsignedBitfield() for a signed value: the value is stored in
 * two's complement form, i.e. as its conversion to uint64_t. */
void setSignedBitfield(unsigned char *p, uint64_t offset, uint64_t bits, int64_t value) {
    setUnsignedBitfield(p,offset,bits,(uint64_t)value);
}

/* Read 'bits' bits from the bitmap 'p' starting at bit position 'offset'
 * and return them as an unsigned integer. Bit 0 of the bitmap is the most
 * significant bit of the first byte; the first bit read becomes the most
 * significant bit of the result. */
uint64_t getUnsignedBitfield(unsigned char *p, uint64_t offset, uint64_t bits) {
    uint64_t byte, bit, byteval, bitval, j, value = 0;

    for (j = 0; j < bits; j++) {
        byte = offset >> 3;
        bit = 7 - (offset & 0x7);
        byteval = p[byte];
        bitval = (byteval >> bit) & 1;
        value = (value<<1) | bitval;
        offset++;
    }
    return value;
}

/* Read 'bits' bits from the bitmap 'p' starting at bit position 'offset'
 * and return them as a two's complement signed integer of that width.
 *
 * A zero-width field yields 0. For a 64 bit field the bits read already are
 * the complete representation, so no sign extension is performed: shifting
 * by the full width of the type would be undefined behavior. */
int64_t getSignedBitfield(unsigned char *p, uint64_t offset, uint64_t bits) {
    uint64_t raw = getUnsignedBitfield(p,offset,bits);

    /* If the top significant bit is 1, propagate it to all the
     * higher bits for two complement representation of signed
     * integers. */
    if (bits > 0 && bits < 64 && (raw & ((uint64_t)1 << (bits-1))))
        raw |= ((uint64_t)-1) << bits;
    return (int64_t)raw;
}

/* The following two functions detect overflow of a value in the context
 * of storing it as an unsigned or signed integer with the specified
 * number of bits. The functions both take the value and a possible increment.
 * If no overflow could happen and the value+increment fit inside the limits,
 * then zero is returned, otherwise in case of overflow, 1 is returned,
 * otherwise in case of underflow, -1 is returned.
 *
 * When non-zero is returned (overflow or underflow), if not NULL, *limit is
 * set to the value the operation should result when an overflow happens,
 * depending on the specified overflow semantics:
 *
 * For BFOVERFLOW_SAT if 1 is returned, *limit is set to the maximum value
 * that you can store in that integer. When -1 is returned, *limit is set to
 * the minimum value that an integer of that size can represent.
 *
 * For BFOVERFLOW_WRAP *limit is set by performing the operation in order to
 * "wrap" around towards zero for unsigned integers, or towards the most
 * negative number that is possible to represent for signed integers. Note
 * that in this mode, when 'limit' is not NULL, 1 is returned for both
 * overflow and underflow.
 *
 * For any other overflow type (BFOVERFLOW_FAIL) *limit is left untouched. */

#define BFOVERFLOW_WRAP 0
#define BFOVERFLOW_SAT 1
#define BFOVERFLOW_FAIL 2 /* Used by the BITFIELD command implementation. */

int checkUnsignedBitfieldOverflow(uint64_t value, int64_t incr, uint64_t bits, int owtype, uint64_t *limit) {
    uint64_t max = (bits == 64) ? UINT64_MAX : (((uint64_t)1<<bits)-1);

    /* The comparisons are done on unsigned quantities so that they stay
     * exact for every width up to 64 bits: 'max-value' is only evaluated
     * when value <= max, and 0-(uint64_t)incr is the magnitude of a
     * negative increment (INT64_MIN included). */
    if (value > max || (incr > 0 && (uint64_t)incr > max-value)) {
        if (limit) {
            if (owtype == BFOVERFLOW_WRAP) {
                goto handle_wrap;
            } else if (owtype == BFOVERFLOW_SAT) {
                *limit = max;
            }
        }
        return 1;
    } else if (incr < 0 && ((uint64_t)0-(uint64_t)incr) > value) {
        if (limit) {
            if (owtype == BFOVERFLOW_WRAP) {
                goto handle_wrap;
            } else if (owtype == BFOVERFLOW_SAT) {
                *limit = 0;
            }
        }
        return -1;
    }
    return 0;

handle_wrap:
    /* Wrapping keeps the low 'bits' bits of the sum. 'max' is exactly the
     * mask of those bits, which avoids shifting by the full type width. */
    *limit = (value+(uint64_t)incr) & max;
    return 1;
}

int checkSignedBitfieldOverflow(int64_t value, int64_t incr, uint64_t bits, int owtype, int64_t *limit) {
    int64_t max = (bits == 64) ? INT64_MAX : (((int64_t)1<<(bits-1))-1);
    int64_t min = (-max)-1;

    /* Note that maxincr and minincr may not be representable when 'value'
     * is far from the limits: they are computed with unsigned arithmetic so
     * that the subtraction itself is always defined, and are only relied
     * upon after checking the 'value' range. */
    int64_t maxincr = (int64_t)((uint64_t)max-(uint64_t)value);
    int64_t minincr = (int64_t)((uint64_t)min-(uint64_t)value);

    if (value > max || (bits != 64 && incr > maxincr) || (value >= 0 && incr > 0 && incr > maxincr))
    {
        if (limit) {
            if (owtype == BFOVERFLOW_WRAP) {
                goto handle_wrap;
            } else if (owtype == BFOVERFLOW_SAT) {
                *limit = max;
            }
        }
        return 1;
    } else if (value < min || (bits != 64 && incr < minincr) || (value < 0 && incr < 0 && incr < minincr)) {
        if (limit) {
            if (owtype == BFOVERFLOW_WRAP) {
                goto handle_wrap;
            } else if (owtype == BFOVERFLOW_SAT) {
                *limit = min;
            }
        }
        return -1;
    }
    return 0;

handle_wrap:
    {
        uint64_t a = value, b = incr, c;
        c = a+b; /* Perform addition as unsigned so that's defined. */

        /* For widths below 64 bits: if the sign bit of the field is set,
         * propagate it to all the higher order bits, to cap the negative
         * value. If it's clear, mask to the positive integer limit.
         * With 64 bits the unsigned sum already is the wrapped result, and
         * shifting by the full width would be undefined. */
        if (bits < 64) {
            uint64_t mask = ((uint64_t)-1) << bits;
            uint64_t msb = (uint64_t)1 << (bits-1);

            if (c & msb) {
                c |= mask;
            } else {
                c &= ~mask;
            }
        }
        *limit = c;
    }
    return 1;
}

/* Debugging function. Just show bits in the specified bitmap. Not used
 * but here for not having to rewrite it when debugging is needed. */
void printBits(unsigned char *p, unsigned long count) {
    unsigned long idx;
    int shift;

    /* Every byte is printed most significant bit first, followed by '|';
     * a newline closes the whole dump. */
    for (idx = 0; idx < count; idx++) {
        for (shift = 7; shift >= 0; shift--)
            printf("%c", ((p[idx] >> shift) & 1) ? '1' : '0');
        printf("|");
    }
    printf("\n");
}

/* -----------------------------------------------------------------------------
 * Bits related string commands: GETBIT, SETBIT, BITCOUNT, BITOP.
 * -------------------------------------------------------------------------- */

#define BITOP_AND   0
#define BITOP_OR    1
#define BITOP_XOR   2
#define BITOP_NOT   3

#define BITFIELDOP_GET 0
#define BITFIELDOP_SET 1
#define BITFIELDOP_INCRBY 2

/* This helper function used by GETBIT / SETBIT parses the bit offset argument
 * making sure an error is returned if it is negative or if it overflows
 * Redis 512 MB limit for the string value.
 *
 * If the 'hash' argument is true, and 'bits is positive, then the command
 * will also parse bit offsets prefixed by "#". In such a case the offset
 * is multiplied by 'bits'. This is useful for the BITFIELD command. */
int getBitOffsetFromArgument(client *c, robj *o, size_t *offset, int hash, int bits) {
    char *err = "bit offset is not an integer or out of range";
    char *str = o->ptr;
    size_t len = sdslen(str);
    /* 1 when the "#<offset>" form is both present and allowed. */
    int skip = (str[0] == '#' && hash && bits > 0) ? 1 : 0;
    long long parsed;

    if (string2ll(str+skip,len-skip,&parsed) == 0) goto invalid;

    /* The "#<offset>" form counts in units of 'bits' bits. */
    if (skip) parsed *= bits;

    /* Reject negative offsets and offsets at or beyond 512MB of bytes. */
    if ((parsed < 0) || ((unsigned long long)parsed >> 3) >= (512*1024*1024))
        goto invalid;

    *offset = (size_t)parsed;
    return VR_OK;

invalid:
    addReplyError(c,err);
    return VR_ERROR;
}

/* This helper function for BITFIELD parses a bitfield type in the form
 * <sign><bits> where sign is 'u' or 'i' for unsigned and signed, and
 * the bits is a value between 1 and 64. However 64 bits unsigned integers
 * are reported as an error because of current limitations of Redis protocol
 * to return unsigned integer values greater than INT64_MAX.
 *
 * On error VR_ERROR is returned and an error is sent to the client. */
int getBitfieldTypeFromArgument(client *c, robj *o, int *sign, int *bits) {
    char *err = "Invalid bitfield type. Use something like i16 u8. Note that u64 is not supported but i64 is.";
    char *spec = o->ptr;
    long long width, maxwidth;

    /* The first character selects the signedness. */
    switch (spec[0]) {
    case 'i':
        *sign = 1;
        break;
    case 'u':
        *sign = 0;
        break;
    default:
        addReplyError(c,err);
        return VR_ERROR;
    }

    /* Signed fields may be up to 64 bits wide, unsigned ones up to 63. */
    maxwidth = (*sign == 1) ? 64 : 63;
    if ((string2ll(spec+1,strlen(spec+1),&width)) == 0 ||
        width < 1 ||
        width > maxwidth)
    {
        addReplyError(c,err);
        return VR_ERROR;
    }

    *bits = width;
    return VR_OK;
}

/* This is an helper function for commands implementations that need to write
 * bits to a string object. The command creates or pad with zeroes the string
 * so that the 'maxbit' bit can be addressed. The object is finally
 * returned. Otherwise if the key holds a wrong type NULL is returned and
 * an error is sent to the client. */
robj *lookupStringForBitCommand(client *c, size_t maxbit, int *expired) {
    robj *o = lookupKeyWrite(c->db,c->argv[1],expired);
    size_t needed = (maxbit >> 3) + 1;   /* Bytes required to address maxbit. */

    if (o != NULL) {
        /* Existing key: it must be a string, which is then unshared and
         * grown (zero padded) to the required length. */
        if (checkType(c,o,OBJ_STRING)) return NULL;
        o = dbUnshareStringValue(c->db,c->argv[1],o);
        o->ptr = sdsgrowzero(o->ptr,needed);
        return o;
    }

    /* Missing key: create a string of the required length and add it. */
    o = createObject(OBJ_STRING,sdsnewlen(NULL, needed));
    dbAdd(c->db,c->argv[1],o);
    return o;
}

/* SETBIT key offset bitvalue */
/* Sets or clears the bit at 'offset' in the string stored at 'key' and
 * replies with the previous value of that bit. The database holding the
 * key is write-locked for the duration of the update. */
void setbitCommand(client *c) {
    robj *o;
    char *err = "bit is not an integer or out of range";
    size_t bitoffset;
    ssize_t byte, bit;
    int byteval, bitval;
    long on;
    int expired = 0;

    if (getBitOffsetFromArgument(c,c->argv[2],&bitoffset,0,0) != VR_OK)
        return;

    if (getLongFromObjectOrReply(c,c->argv[3],&on,err) != VR_OK)
        return;

    /* Bits can only be set or cleared... */
    if (on & ~1) {
        addReplyError(c,err);
        return;
    }

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);
    if ((o = lookupStringForBitCommand(c,bitoffset,&expired)) == NULL) { 
        /* No usable string object: release the lock before returning and
         * account for a key expired during the lookup, if any. */
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        return;
    }

    /* Get current values */
    byte = bitoffset >> 3;
    byteval = ((uint8_t*)o->ptr)[byte];
    bit = 7 - (bitoffset & 0x7);
    bitval = byteval & (1 << bit);

    /* Update byte with new bit value and return original value */
    byteval &= ~(1 << bit);
    byteval |= ((on & 0x1) << bit);
    ((uint8_t*)o->ptr)[byte] = byteval;
    signalModifiedKey(c->db,c->argv[1]);
    notifyKeyspaceEvent(NOTIFY_STRING,"setbit",c->argv[1],c->db->id);
    c->vel->dirty++;
    addReply(c, bitval ? shared.cone : shared.czero);
    unlockDb(c->db);
    /* The expired-keys statistic is updated after the lock is released. */
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* GETBIT key offset
 *
 * Replies with the bit stored at 'offset'. Offsets past the end of the
 * string, and missing keys, read as 0. */
void getbitCommand(client *c) {
    char intbuf[32];
    size_t bitoffset;
    size_t idx, shift;
    size_t isset = 0;
    robj *o;

    if (getBitOffsetFromArgument(c,c->argv[2],&bitoffset,0,0) != VR_OK)
        return;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    o = lookupKeyReadOrReply(c,c->argv[1],shared.czero);
    if (o == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }

    /* On a wrong type checkType() has already replied: just skip to the
     * shared "hit" epilogue. */
    if (!checkType(c,o,OBJ_STRING)) {
        idx = bitoffset >> 3;
        shift = 7 - (bitoffset & 0x7);
        if (sdsEncodedObject(o)) {
            if (idx < sdslen(o->ptr))
                isset = ((uint8_t*)o->ptr)[idx] & (1 << shift);
        } else if (idx < (size_t)ll2string(intbuf,sizeof(intbuf),(long)o->ptr)) {
            /* Integer encoded value: inspect its decimal representation. */
            isset = intbuf[idx] & (1 << shift);
        }
        addReply(c, isset ? shared.cone : shared.czero);
    }

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* BITOP op_name target_key src_key1 src_key2 src_key3 ... src_keyN
 *
 * Computes the bitwise AND / OR / XOR of all the source strings, or the
 * NOT of a single source string, and stores the result in target_key.
 * Missing source keys are treated as empty strings and shorter inputs are
 * zero-padded up to the length of the longest one. When every input is
 * empty the target key is deleted instead. The reply is the length in
 * bytes of the resulting string.
 *
 * NOTE(review): unlike SETBIT/GETBIT/BITCOUNT/BITPOS in this file, this
 * function neither calls fetchInternalDbByKey() nor takes the db lock, and
 * it bumps server.dirty rather than c->vel->dirty — confirm this is
 * intended. */
void bitopCommand(client *c) {
    char *opname = c->argv[1]->ptr;
    robj *o, *targetkey = c->argv[2];
    unsigned long op, j, numkeys;
    robj **objects;      /* Array of source objects. */
    unsigned char **src; /* Array of source strings pointers. */
    unsigned long *len, maxlen = 0; /* Array of length of src strings,
                                       and max len. */
    unsigned long minlen = 0;    /* Min len among the input keys. */
    unsigned char *res = NULL; /* Resulting string. */

    /* Parse the operation name. The first-character test is a cheap filter
     * performed before the full case-insensitive comparison. */
    if ((opname[0] == 'a' || opname[0] == 'A') && !strcasecmp(opname,"and"))
        op = BITOP_AND;
    else if((opname[0] == 'o' || opname[0] == 'O') && !strcasecmp(opname,"or"))
        op = BITOP_OR;
    else if((opname[0] == 'x' || opname[0] == 'X') && !strcasecmp(opname,"xor"))
        op = BITOP_XOR;
    else if((opname[0] == 'n' || opname[0] == 'N') && !strcasecmp(opname,"not"))
        op = BITOP_NOT;
    else {
        addReply(c,shared.syntaxerr);
        return;
    }

    /* Sanity check: NOT accepts only a single key argument. */
    if (op == BITOP_NOT && c->argc != 4) {
        addReplyError(c,"BITOP NOT must be called with a single source key.");
        return;
    }

    /* Lookup keys, and store pointers to the string objects into an array. */
    numkeys = c->argc - 3;
    src = dalloc(sizeof(unsigned char*) * numkeys);
    len = dalloc(sizeof(long) * numkeys);
    objects = dalloc(sizeof(robj*) * numkeys);
    for (j = 0; j < numkeys; j++) {
        o = lookupKeyRead(c->db,c->argv[j+3]);
        /* Handle non-existing keys as empty strings. */
        if (o == NULL) {
            objects[j] = NULL;
            src[j] = NULL;
            len[j] = 0;
            minlen = 0;
            continue;
        }
        /* Return an error if one of the keys is not a string. The objects
         * obtained so far via getDecodedObject() are released first. */
        if (checkType(c,o,OBJ_STRING)) {
            unsigned long i;
            for (i = 0; i < j; i++) {
                if (objects[i])
                    decrRefCount(objects[i]);
            }
            dfree(src);
            dfree(len);
            dfree(objects);
            return;
        }
        objects[j] = getDecodedObject(o);
        src[j] = objects[j]->ptr;
        len[j] = sdslen(objects[j]->ptr);
        if (len[j] > maxlen) maxlen = len[j];
        if (j == 0 || len[j] < minlen) minlen = len[j];
    }

    /* Compute the bit operation, if at least one string is not empty. */
    if (maxlen) {
        res = (unsigned char*) sdsnewlen(NULL,maxlen);
        unsigned char output, byte;
        unsigned long i;

        /* Fast path: as far as we have data for all the input bitmaps we
         * can take a fast path that performs much better than the
         * vanilla algorithm. It processes four unsigned longs per
         * iteration and is limited to 16 keys by the size of lp[]. */
        j = 0;
        if (minlen >= sizeof(unsigned long)*4 && numkeys <= 16) {
            unsigned long *lp[16];
            unsigned long *lres = (unsigned long*) res;

            /* Note: sds pointer is always aligned to 8 byte boundary. */
            memcpy(lp,src,sizeof(unsigned long*)*numkeys);
            /* The result starts as a copy of the first source, which is why
             * the loops below start from key 1 and never advance lp[0]. */
            memcpy(res,src[0],minlen);

            /* Different branches per different operations for speed (sorry). */
            if (op == BITOP_AND) {
                while(minlen >= sizeof(unsigned long)*4) {
                    for (i = 1; i < numkeys; i++) {
                        lres[0] &= lp[i][0];
                        lres[1] &= lp[i][1];
                        lres[2] &= lp[i][2];
                        lres[3] &= lp[i][3];
                        lp[i]+=4;
                    }
                    lres+=4;
                    j += sizeof(unsigned long)*4;
                    minlen -= sizeof(unsigned long)*4;
                }
            } else if (op == BITOP_OR) {
                while(minlen >= sizeof(unsigned long)*4) {
                    for (i = 1; i < numkeys; i++) {
                        lres[0] |= lp[i][0];
                        lres[1] |= lp[i][1];
                        lres[2] |= lp[i][2];
                        lres[3] |= lp[i][3];
                        lp[i]+=4;
                    }
                    lres+=4;
                    j += sizeof(unsigned long)*4;
                    minlen -= sizeof(unsigned long)*4;
                }
            } else if (op == BITOP_XOR) {
                while(minlen >= sizeof(unsigned long)*4) {
                    for (i = 1; i < numkeys; i++) {
                        lres[0] ^= lp[i][0];
                        lres[1] ^= lp[i][1];
                        lres[2] ^= lp[i][2];
                        lres[3] ^= lp[i][3];
                        lp[i]+=4;
                    }
                    lres+=4;
                    j += sizeof(unsigned long)*4;
                    minlen -= sizeof(unsigned long)*4;
                }
            } else if (op == BITOP_NOT) {
                while(minlen >= sizeof(unsigned long)*4) {
                    lres[0] = ~lres[0];
                    lres[1] = ~lres[1];
                    lres[2] = ~lres[2];
                    lres[3] = ~lres[3];
                    lres+=4;
                    j += sizeof(unsigned long)*4;
                    minlen -= sizeof(unsigned long)*4;
                }
            }
        }

        /* j is set to the next byte to process by the previous loop.
         * The remaining bytes are handled one at a time, reading 0 for
         * every source that is shorter than the current position. */
        for (; j < maxlen; j++) {
            output = (len[0] <= j) ? 0 : src[0][j];
            if (op == BITOP_NOT) output = ~output;
            for (i = 1; i < numkeys; i++) {
                byte = (len[i] <= j) ? 0 : src[i][j];
                switch(op) {
                case BITOP_AND: output &= byte; break;
                case BITOP_OR:  output |= byte; break;
                case BITOP_XOR: output ^= byte; break;
                }
            }
            res[j] = output;
        }
    }
    /* Release the decoded source objects and the temporary arrays. */
    for (j = 0; j < numkeys; j++) {
        if (objects[j])
            decrRefCount(objects[j]);
    }
    dfree(src);
    dfree(len);
    dfree(objects);

    /* Store the computed value into the target key */
    if (maxlen) {
        o = createObject(OBJ_STRING,res);
        setKey(c->db,targetkey,o,NULL);
        notifyKeyspaceEvent(NOTIFY_STRING,"set",targetkey,c->db->id);
        decrRefCount(o);
    } else if (dbDelete(c->db,targetkey)) {
        /* Empty result: the target key, if it existed, was removed. */
        signalModifiedKey(c->db,targetkey);
        notifyKeyspaceEvent(NOTIFY_GENERIC,"del",targetkey,c->db->id);
    }
    server.dirty++;
    addReplyLongLong(c,maxlen); /* Return the output string length in bytes. */
}

/* BITCOUNT key [start end]
 *
 * Replies with the number of set bits in the string stored at 'key',
 * optionally restricted to the inclusive byte range start..end. Negative
 * indexes count from the end of the string. */
void bitcountCommand(client *c) {
    robj *o;
    long start, end, slen;
    unsigned char *data;
    char intbuf[32];

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    /* A missing key gets a zero reply from the lookup helper itself. */
    o = lookupKeyReadOrReply(c,c->argv[1],shared.czero);
    if (o == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }
    if (checkType(c,o,OBJ_STRING)) goto done;

    /* Point 'data' at the bytes to scan: for integer encoded values that
     * is the decimal representation rendered into a stack buffer. */
    if (o->encoding == OBJ_ENCODING_INT) {
        data = (unsigned char*) intbuf;
        slen = ll2string(intbuf,sizeof(intbuf),(long)o->ptr);
    } else {
        data = (unsigned char*) o->ptr;
        slen = sdslen(o->ptr);
    }

    switch (c->argc) {
    case 2:
        /* No range given: scan the whole string. */
        start = 0;
        end = slen-1;
        break;
    case 4:
        if (getLongFromObjectOrReply(c,c->argv[2],&start,NULL) != VR_OK)
            goto done;
        if (getLongFromObjectOrReply(c,c->argv[3],&end,NULL) != VR_OK)
            goto done;
        /* Resolve negative indexes, then clamp to the string bounds. */
        if (start < 0) start += slen;
        if (end < 0) end += slen;
        if (start < 0) start = 0;
        if (end < 0) end = 0;
        if (end >= slen) end = slen-1;
        break;
    default:
        /* Any other argument count is a syntax error. */
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        addReply(c,shared.syntaxerr);
        return;
    }

    /* Here end < slen always holds, so an empty result can only come from
     * start > end. */
    if (start > end)
        addReply(c,shared.czero);
    else
        addReplyLongLong(c,redisPopcount(data+start,end-start+1));

done:
    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* BITPOS key bit [start [end]]
 *
 * Replies with the position of the first bit set to 'bit' (0 or 1) in the
 * string stored at 'key', optionally restricted to the inclusive byte
 * range start..end. Negative indexes count from the end of the string. */
void bitposCommand(client *c) {
    robj *o;
    long bit, start, end, slen;
    unsigned char *data;
    char intbuf[32];
    int end_given = 0;

    /* The bit argument selects whether we search for set or clear bits. */
    if (getLongFromObjectOrReply(c,c->argv[2],&bit,NULL) != VR_OK)
        return;
    if (bit != 0 && bit != 1) {
        addReplyError(c, "The bit argument must be 1 or 0.");
        return;
    }

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    /* A missing key is seen as an infinite array of zero bits: the first
     * clear bit is at position 0, while a set bit can't be found (-1). */
    o = lookupKeyRead(c->db,c->argv[1]);
    if (o == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        addReplyLongLong(c, bit ? -1 : 0);
        return;
    }
    if (checkType(c,o,OBJ_STRING)) goto done;

    /* Point 'data' at the bytes to scan: for integer encoded values that
     * is the decimal representation rendered into a stack buffer. */
    if (o->encoding == OBJ_ENCODING_INT) {
        data = (unsigned char*) intbuf;
        slen = ll2string(intbuf,sizeof(intbuf),(long)o->ptr);
    } else {
        data = (unsigned char*) o->ptr;
        slen = sdslen(o->ptr);
    }

    switch (c->argc) {
    case 3:
        /* No range given: scan the whole string. */
        start = 0;
        end = slen-1;
        break;
    case 4:
    case 5:
        if (getLongFromObjectOrReply(c,c->argv[3],&start,NULL) != VR_OK)
            goto done;
        if (c->argc == 5) {
            if (getLongFromObjectOrReply(c,c->argv[4],&end,NULL) != VR_OK)
                goto done;
            end_given = 1;
        } else {
            end = slen-1;
        }
        /* Resolve negative indexes, then clamp to the string bounds. */
        if (start < 0) start += slen;
        if (end < 0) end += slen;
        if (start < 0) start = 0;
        if (end < 0) end = 0;
        if (end >= slen) end = slen-1;
        break;
    default:
        /* Any other argument count is a syntax error. */
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        addReply(c,shared.syntaxerr);
        return;
    }

    if (start > end) {
        /* An empty range contains neither a 0 nor a 1. */
        addReplyLongLong(c, -1);
    } else {
        long bytes = end-start+1;
        long pos = redisBitpos(data+start,bytes,bit);

        /* When searching for a clear bit inside an explicit start-end
         * range, the area to the right of the range must not be treated
         * as zero padding (as it is when no end is given). So when
         * redisBitpos() reports the first bit outside the range, the
         * range holds no "0" bit at all and the reply is -1. */
        if (end_given && bit == 0 && pos == bytes*8) {
            unlockDb(c->db);
            update_stats_add(c->vel->stats, keyspace_hits, 1);
            addReplyLongLong(c,-1);
            return;
        }
        if (pos != -1) pos += start*8; /* Account for the skipped bytes. */
        addReplyLongLong(c,pos);
    }

done:
    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* BITFIELD key subcommand-1 arg ... subcommand-2 arg ... subcommand-N ...
 *
 * Supported subcommands:
 *
 * GET <type> <offset>
 * SET <type> <offset> <value>
 * INCRBY <type> <offset> <increment>
 * OVERFLOW [WRAP|SAT|FAIL]
 */

/* One parsed BITFIELD sub-operation. bitfieldCommand() fills an array of
 * these while validating the arguments and executes them afterwards. */
struct bitfieldOp {
    uint64_t offset;    /* Bitfield offset, in bits. */
    int64_t i64;        /* Increment amount (INCRBY) or SET value;
                           left at 0 for GET. */
    int opcode;         /* Operation id: BITFIELDOP_GET, BITFIELDOP_SET or
                           BITFIELDOP_INCRBY. */
    int owtype;         /* Overflow type to use (BFOVERFLOW_WRAP, _SAT or
                           _FAIL): the one in effect when the op was
                           parsed. */
    int bits;           /* Integer bitfield bits width. */
    int sign;           /* True if signed, otherwise unsigned op. */
};

/* Implementation of the BITFIELD command.
 *
 * The arguments are parsed and validated first, producing an array of
 * 'struct bitfieldOp'; only when the whole command line is valid the
 * operations are executed in order, one reply element per GET / SET /
 * INCRBY operation. OVERFLOW only changes the overflow policy applied to
 * the operations that follow it and produces no reply element.
 *
 * The 'ops' array is heap allocated and is released on every exit path. */
void bitfieldCommand(client *c) {
    robj *o;
    size_t bitoffset;
    int j, numops = 0, changes = 0;
    struct bitfieldOp *ops = NULL; /* Array of ops to execute at end. */
    int owtype = BFOVERFLOW_WRAP; /* Overflow type. */

    for (j = 2; j < c->argc; j++) {
        int remargs = c->argc-j-1; /* Remaining args other than current. */
        char *subcmd = c->argv[j]->ptr; /* Current command name. */
        int opcode; /* Current operation code. */
        long long i64 = 0;  /* Signed SET value. */
        int sign = 0; /* Signed or unsigned type? */
        int bits = 0; /* Bitfield width in bits. */

        if (!strcasecmp(subcmd,"get") && remargs >= 2)
            opcode = BITFIELDOP_GET;
        else if (!strcasecmp(subcmd,"set") && remargs >= 3)
            opcode = BITFIELDOP_SET;
        else if (!strcasecmp(subcmd,"incrby") && remargs >= 3)
            opcode = BITFIELDOP_INCRBY;
        else if (!strcasecmp(subcmd,"overflow") && remargs >= 1) {
            char *owtypename = c->argv[j+1]->ptr;
            j++;
            if (!strcasecmp(owtypename,"wrap"))
                owtype = BFOVERFLOW_WRAP;
            else if (!strcasecmp(owtypename,"sat"))
                owtype = BFOVERFLOW_SAT;
            else if (!strcasecmp(owtypename,"fail"))
                owtype = BFOVERFLOW_FAIL;
            else {
                addReplyError(c,"Invalid OVERFLOW type specified");
                dfree(ops);
                return;
            }
            continue;
        } else {
            addReply(c,shared.syntaxerr);
            dfree(ops);
            return;
        }

        /* Get the type and offset arguments, common to all the ops. */
        if (getBitfieldTypeFromArgument(c,c->argv[j+1],&sign,&bits) != VR_OK) {
            dfree(ops);
            return;
        }

        if (getBitOffsetFromArgument(c,c->argv[j+2],&bitoffset,1,bits) != VR_OK){
            dfree(ops);
            return;
        }

        /* INCRBY and SET require another argument. */
        if (opcode != BITFIELDOP_GET) {
            if (getLongLongFromObjectOrReply(c,c->argv[j+3],&i64,NULL) != VR_OK){
                dfree(ops);
                return;
            }
        }

        /* Populate the array of operations we'll process. */
        ops = drealloc(ops,sizeof(*ops)*(numops+1));
        ops[numops].offset = bitoffset;
        ops[numops].i64 = i64;
        ops[numops].opcode = opcode;
        ops[numops].owtype = owtype;
        ops[numops].bits = bits;
        ops[numops].sign = sign;
        numops++;

        /* Skip the arguments consumed by this op: GET takes one less. */
        j += 3 - (opcode == BITFIELDOP_GET);
    }

    addReplyMultiBulkLen(c,numops);

    /* Actually process the operations. */
    for (j = 0; j < numops; j++) {
        struct bitfieldOp *thisop = ops+j;

        /* Execute the operation. */
        if (thisop->opcode == BITFIELDOP_SET ||
            thisop->opcode == BITFIELDOP_INCRBY)
        {
            /* SET and INCRBY: We handle both with the same code path
             * for simplicity. SET return value is the previous value so
             * we need fetch & store as well. */

            /* Lookup by making room up to the farthest bit reached by
             * this operation. On a wrong type the error reply has already
             * been queued: release the ops array before bailing out so
             * that it is not leaked.
             * NOTE(review): the multi bulk header was already emitted at
             * this point, so the error follows it in the reply stream. */
            if ((o = lookupStringForBitCommand(c,
                thisop->offset + (thisop->bits-1), NULL)) == NULL)
            {
                dfree(ops);
                return;
            }

            /* We need two different but very similar code paths for signed
             * and unsigned operations, since the set of functions to get/set
             * the integers and the used variables types are different. */
            if (thisop->sign) {
                int64_t oldval, newval, wrapped, retval;
                int overflow;

                oldval = getSignedBitfield(o->ptr,thisop->offset,
                        thisop->bits);

                if (thisop->opcode == BITFIELDOP_INCRBY) {
                    newval = oldval + thisop->i64;
                    overflow = checkSignedBitfieldOverflow(oldval,
                            thisop->i64,thisop->bits,thisop->owtype,&wrapped);
                    if (overflow) newval = wrapped;
                    retval = newval;
                } else {
                    newval = thisop->i64;
                    overflow = checkSignedBitfieldOverflow(newval,
                            0,thisop->bits,thisop->owtype,&wrapped);
                    if (overflow) newval = wrapped;
                    retval = oldval;
                }

                /* On overflow of type is "FAIL", don't write and return
                 * NULL to signal the condition. */
                if (!(overflow && thisop->owtype == BFOVERFLOW_FAIL)) {
                    addReplyLongLong(c,retval);
                    setSignedBitfield(o->ptr,thisop->offset,
                                      thisop->bits,newval);
                } else {
                    addReply(c,shared.nullbulk);
                }
            } else {
                uint64_t oldval, newval, wrapped, retval;
                int overflow;

                oldval = getUnsignedBitfield(o->ptr,thisop->offset,
                        thisop->bits);

                if (thisop->opcode == BITFIELDOP_INCRBY) {
                    newval = oldval + thisop->i64;
                    overflow = checkUnsignedBitfieldOverflow(oldval,
                            thisop->i64,thisop->bits,thisop->owtype,&wrapped);
                    if (overflow) newval = wrapped;
                    retval = newval;
                } else {
                    newval = thisop->i64;
                    overflow = checkUnsignedBitfieldOverflow(newval,
                            0,thisop->bits,thisop->owtype,&wrapped);
                    if (overflow) newval = wrapped;
                    retval = oldval;
                }
                /* On overflow of type is "FAIL", don't write and return
                 * NULL to signal the condition. */
                if (!(overflow && thisop->owtype == BFOVERFLOW_FAIL)) {
                    addReplyLongLong(c,retval);
                    setUnsignedBitfield(o->ptr,thisop->offset,
                                        thisop->bits,newval);
                } else {
                    addReply(c,shared.nullbulk);
                }
            }
            changes++;
        } else {
            /* GET */
            unsigned char buf[9];
            char llbuf[32];
            unsigned char *src = NULL;
            size_t olen = 0;
            size_t byte = thisop->offset >> 3;
            int i;

            o = lookupKeyRead(c->db,c->argv[1]);
            if (o != NULL) {
                /* The value must be a string: reading any other type as
                 * an sds would access unrelated memory. */
                if (checkType(c,o,OBJ_STRING)) {
                    dfree(ops);
                    return;
                }
                /* Integer encoded strings keep the number in the pointer
                 * itself, so they are rendered into a local buffer first
                 * (same approach used by GETBIT). */
                if (sdsEncodedObject(o)) {
                    src = o->ptr;
                    olen = sdslen(o->ptr);
                } else {
                    olen = (size_t)ll2string(llbuf,sizeof(llbuf),
                                             (long)o->ptr);
                    src = (unsigned char*) llbuf;
                }
            }

            /* For GET we use a trick: before executing the operation
             * copy up to 9 bytes to a local buffer, so that we can easily
             * execute up to 64 bit operations that are at actual string
             * object boundaries. */
            memset(buf,0,9);
            for (i = 0; i < 9; i++) {
                if (src == NULL || i+byte >= olen) break;
                buf[i] = src[i+byte];
            }

            /* Now operate on the copied buffer which is guaranteed
             * to be zero-padded. */
            if (thisop->sign) {
                int64_t val = getSignedBitfield(buf,thisop->offset-(byte*8),
                                            thisop->bits);
                addReplyLongLong(c,val);
            } else {
                uint64_t val = getUnsignedBitfield(buf,thisop->offset-(byte*8),
                                            thisop->bits);
                addReplyLongLong(c,val);
            }
        }
    }

    if (changes) {
        signalModifiedKey(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_STRING,"setbit",c->argv[1],c->db->id);
        server.dirty += changes;
    }
    dfree(ops);
}


================================================
FILE: src/vr_bitops.h
================================================
#ifndef _VR_BITOPS_H_
#define _VR_BITOPS_H_

/* Helpers working on raw byte buffers. */
size_t redisPopcount(void *s, long count);
long redisBitpos(void *s, unsigned long count, int bit);
void setUnsignedBitfield(unsigned char *p, uint64_t offset, uint64_t bits, uint64_t value);
void setSignedBitfield(unsigned char *p, uint64_t offset, uint64_t bits, int64_t value);
uint64_t getUnsignedBitfield(unsigned char *p, uint64_t offset, uint64_t bits);
int64_t getSignedBitfield(unsigned char *p, uint64_t offset, uint64_t bits);
int checkUnsignedBitfieldOverflow(uint64_t value, int64_t incr, uint64_t bits, int owtype, uint64_t *limit);
int checkSignedBitfieldOverflow(int64_t value, int64_t incr, uint64_t bits, int owtype, int64_t *limit);
void printBits(unsigned char *p, unsigned long count);

/* Argument parsing and key lookup helpers shared by the bit commands. */
int getBitOffsetFromArgument(struct client *c, robj *o, size_t *offset, int hash, int bits);
int getBitfieldTypeFromArgument(struct client *c, robj *o, int *sign, int *bits);
robj *lookupStringForBitCommand(struct client *c, size_t maxbit, int *expired);

/* Command implementations. All the prototypes spell the client type as
 * 'struct client', so they do not depend on the 'client' typedef. */
void setbitCommand(struct client *c);
void getbitCommand(struct client *c);
void bitopCommand(struct client *c);
void bitcountCommand(struct client *c);
void bitposCommand(struct client *c);
void bitfieldCommand(struct client *c);
#endif


================================================
FILE: src/vr_block.c
================================================
#include <vr_core.h>

#include <limits.h>


/* Unblock client 'c': run the handler matching the kind of operation it
 * was blocked on, reset its blocking state and queue it in the list of
 * unblocked clients of its event loop. */
void unblockClient(client *c) {
    switch (c->btype) {
    case BLOCKED_LIST:
        unblockClientWaitingData(c);
        break;
    case BLOCKED_WAIT:
        unblockClientWaitingReplicas(c);
        break;
    default:
        serverPanic("Unknown btype in unblockClient().");
        break;
    }

    /* Reset the blocking state so that new commands in the query buffer
     * of this client get processed ASAP. */
    c->flags &= ~CLIENT_BLOCKED;
    c->btype = BLOCKED_NONE;
    c->vel->bpop_blocked_clients--;

    /* A previous blocking operation may have queued the client already:
     * never add it to the unblocked list twice. */
    if (c->flags & CLIENT_UNBLOCKED) return;
    c->flags |= CLIENT_UNBLOCKED;
    dlistAddNodeTail(c->vel->unblocked_clients,c);
}

/* Get a timeout value from an object and store it into 'timeout'.
 * The final timeout is always stored as milliseconds as a time where the
 * timeout will expire, however the parsing is performed according to
 * the 'unit' that can be seconds or milliseconds.
 *
 * Note that if the timeout is zero (usually from the point of view of
 * commands API this means no timeout) the value stored into 'timeout'
 * is zero.
 *
 * Returns VR_OK on success. Returns VR_ERROR, after replying to the client
 * with an error, when the argument is not an integer, is negative, or is
 * so large that converting it to an absolute millisecond time would
 * overflow a long long. */
int getTimeoutFromObjectOrReply(client *c, robj *object, long long *timeout, int unit) {
    long long tval;

    if (getLongLongFromObjectOrReply(c,object,&tval,
        "timeout is not an integer or out of range") != VR_OK)
        return VR_ERROR;

    if (tval < 0) {
        addReplyError(c,"timeout is negative");
        return VR_ERROR;
    }

    if (tval > 0) {
        long long now;

        /* The value comes straight from the client: check the range
         * before every arithmetic step, since signed overflow is
         * undefined behavior. */
        if (unit == UNIT_SECONDS) {
            if (tval > LLONG_MAX/1000) {
                addReplyError(c,"timeout is out of range");
                return VR_ERROR;
            }
            tval *= 1000;
        }
        now = vr_msec_now();
        if (now > 0 && tval > LLONG_MAX - now) {
            addReplyError(c,"timeout is out of range");
            return VR_ERROR;
        }
        tval += now;
    }
    *timeout = tval;

    return VR_OK;
}

/* Mark client 'c' as blocked on an operation of type 'btype' and account
 * for it in the per event loop counter of blocked clients. While the
 * CLIENT_BLOCKED flag is set the client query buffer is no longer
 * processed, but accumulated, and will be processed when the client is
 * unblocked. */
void blockClient(client *c, int btype) {
    c->btype = btype;
    c->flags |= CLIENT_BLOCKED;
    c->vel->bpop_blocked_clients++;
}


================================================
FILE: src/vr_block.h
================================================
#ifndef _VR_BLOCK_H_
#define _VR_BLOCK_H_

/* This structure holds the blocking operation state for a client.
 * The fields used depend on client->btype. */
typedef struct blockingState {
    /* Generic fields. */
    long long timeout;       /* Blocking operation timeout. If UNIX current time
                             * is > timeout then the operation timed out.
                             * NOTE(review): presumably an absolute time in
                             * milliseconds with 0 meaning "no timeout", as
                             * produced by getTimeoutFromObjectOrReply() --
                             * confirm against the callers. */

    /* BLOCKED_LIST */
    dict *keys;             /* The keys we are waiting to terminate a blocking
                             * operation such as BLPOP. Otherwise NULL. */
    robj *target;           /* The key that should receive the element,
                             * for BRPOPLPUSH. */

    /* BLOCKED_WAIT */
    int numreplicas;        /* Number of replicas we are waiting for ACK. */
    long long reploffset;   /* Replication offset to reach. */
} blockingState;

void blockClient(struct client *c, int btype);
void unblockClient(struct client *c);
int getTimeoutFromObjectOrReply(struct client *c, robj *object, long long *timeout, int unit);

#endif


================================================
FILE: src/vr_client.c
================================================
#include <vr_core.h>

/* NOTE(review): nothing in this part of the file updates the counter;
 * presumably it is maintained by the connection handling code -- confirm. */
int ncurr_cconn = 0;       /* current # client connections */

/* Forward declaration of a helper private to this file. */
static void setProtocolError(client *c, int pos);

/* Size, as reported by the allocator (so including internal
 * fragmentation), of the allocation backing the SDS string 's'. This
 * function is used in order to compute the client output buffer size. */
size_t sdsZmallocSize(sds s) {
    return dmalloc_size(sdsAllocPtr(s));
}

/* Dup method installed on the client reply list by createClient(): the
 * "copy" is the very same pointer, no new object is created.
 * NOTE(review): the matching free method calls freeObject(), so two lists
 * sharing a value through this method would both try to free it -- confirm
 * the reply list is never duplicated, or that ownership is handled by the
 * caller. */
void *dupClientReplyValue(void *o) {
    return o;
}

/* Free method installed on the client reply list by createClient():
 * releases a queued reply object through freeObject(). */
void freeClientReplyValue(void *o) {
    freeObject(o);
}

/* Match method installed on the client pubsub_patterns list by
 * createClient(): compares two list values with equalStringObjects() and
 * returns its result. */
int listMatchObjects(void *a, void *b) {
    return equalStringObjects(a,b);
}

/* Allocate and initialize a client bound to the event loop 'vel' and to the
 * connection 'conn'.
 *
 * When conn->sd is not -1 the socket is configured (non blocking, no delay,
 * optional keepalive), a readable event running readQueryFromClient() is
 * registered on it, and the client is appended to vel->clients. If the
 * event can't be registered the client is freed and NULL is returned.
 *
 * 'conn' itself is always dereferenced, so it must not be NULL even for a
 * non connected client. */
client *createClient(vr_eventloop *vel, struct conn *conn) {
    client *c = dalloc(sizeof(client));

    /* passing -1 as fd it is possible to create a non connected client.
     * This is useful since all the commands needs to be executed
     * in the context of a client. When commands are executed in other
     * contexts (for instance a Lua script) we need a non connected client. */
    if (conn->sd != -1) {
        vr_set_nonblocking(conn->sd);
        vr_set_tcpnodelay(conn->sd);
        if (server.tcpkeepalive)
            vr_set_tcpkeepalive(conn->sd,server.tcpkeepalive,0,0);
        if (aeCreateFileEvent(vel->el,conn->sd,AE_READABLE,
            readQueryFromClient, c) == AE_ERR)
        {
            log_error("Unrecoverable error creating client ipfd file event.");
            /* Nothing but the client structure was allocated so far. */
            dfree(c);
            return NULL;
        }
    }

    /* Identity and ownership. */
    selectDb(c,0);
    c->id = vel->next_client_id++;
    c->conn = conn;
    c->vel = vel;
    c->scanid = -1;
    c->name = NULL;
    /* Query parsing state. */
    c->bufpos = 0;
    c->querybuf = sdsempty();
    c->querybuf_peak = 0;
    c->reqtype = 0;
    c->argc = 0;
    c->argv = NULL;
    c->cmd = c->lastcmd = NULL;
    c->multibulklen = 0;
    c->bulklen = -1;
    c->sentlen = 0;
    c->flags = 0;
    c->ctime = c->lastinteraction = vel->unixtime;
    c->authenticated = 0;
    /* Replication state. */
    c->replstate = REPL_STATE_NONE;
    c->repl_put_online_on_ack = 0;
    c->reploff = 0;
    c->repl_ack_off = 0;
    c->repl_ack_time = 0;
    c->slave_listening_port = 0;
    c->slave_capa = SLAVE_CAPA_NONE;
    /* Output buffer: list of reply objects plus accounting. */
    c->reply = dlistCreate();
    c->reply_bytes = 0;
    c->obuf_soft_limit_reached_time = 0;
    dlistSetFreeMethod(c->reply,freeClientReplyValue);
    dlistSetDupMethod(c->reply,dupClientReplyValue);
    /* Blocking operations state. */
    c->btype = BLOCKED_NONE;
    c->bpop.timeout = 0;
    c->bpop.keys = dictCreate(&setDictType,NULL);
    c->bpop.target = NULL;
    c->bpop.numreplicas = 0;
    c->bpop.reploffset = 0;
    c->woff = 0;
    /* WATCH and Pub/Sub state. */
    c->watched_keys = dlistCreate();
    c->pubsub_channels = dictCreate(&setDictType,NULL);
    c->pubsub_patterns = dlistCreate();
    c->peerid = NULL;
    c->curidx = -1;
    c->taridx = -1;
    c->steps = 0;
    c->cache = NULL;
    dlistSetFreeMethod(c->pubsub_patterns,decrRefCountVoid);
    dlistSetMatchMethod(c->pubsub_patterns,listMatchObjects);
    /* Only connected clients are tracked in the event loop clients list. */
    if (conn->sd != -1) dlistAddNodeTail(vel->clients,c);
    initClientMultiState(c);
    return c;
}

/* Called before any data is appended to the output buffers of a client.
 *
 * Return value:
 *
 *   VR_OK    - the caller may queue data in the output buffers of 'c'.
 *   VR_ERROR - no data must be appended: replies are disabled for this
 *              client (CLIENT REPLY OFF / SKIP), the client is a master
 *              that is not forced to receive replies, or it has no valid
 *              socket (fake client).
 *
 * When VR_OK is returned for a client that had no pending replies and was
 * not flagged yet, the client is flagged CLIENT_PENDING_WRITE and queued in
 * the list of clients with pending writes of its event loop. This is
 * skipped when:
 *
 * 1) The output buffers already contained something, or the client was
 *    already flagged: it is scheduled already.
 * 2) The client is a slave that is not online yet: writes are only
 *    accumulated in the buffer for now. */
int prepareClientToWrite(client *c) {
    int can_receive_now;

    /* The Lua client has no socket at all: always ok, nothing to
     * schedule. */
    if (c->flags & CLIENT_LUA) return VR_OK;

    /* CLIENT REPLY OFF / SKIP handling: don't send replies. */
    if (c->flags & (CLIENT_REPLY_OFF|CLIENT_REPLY_SKIP)) return VR_ERROR;

    /* Masters don't receive replies, unless CLIENT_MASTER_FORCE_REPLY
     * is set. */
    if ((c->flags & CLIENT_MASTER) &&
        !(c->flags & CLIENT_MASTER_FORCE_REPLY)) return VR_ERROR;

    /* Fake client for AOF loading. */
    if (c->conn->sd <= 0) return VR_ERROR;

    /* Already scheduled: either there is pending output or the client was
     * flagged before. */
    if (clientHasPendingReplies(c)) return VR_OK;
    if (c->flags & CLIENT_PENDING_WRITE) return VR_OK;

    /* Slaves are scheduled only once they can actually receive writes. */
    can_receive_now =
        c->replstate == REPL_STATE_NONE ||
        (c->replstate == SLAVE_STATE_ONLINE && !c->repl_put_online_on_ack);
    if (!can_receive_now) return VR_OK;

    /* Instead of installing the write handler right away, flag the client
     * and put it into the list of clients having something to write. This
     * way, before re-entering the event loop, a direct write to the socket
     * can be attempted, saving a system call. The write handler is only
     * installed when the whole reply can't be written at once. */
    c->flags |= CLIENT_PENDING_WRITE;
    dlistAddNodeHead(c->vel->clients_pending_write,c);

    /* Authorize the caller to queue in the output buffer of this client. */
    return VR_OK;
}

/* Make the tail object of 'reply' safe to modify in place.
 *
 * When the tail object is flagged 'constant' the list node is re-pointed
 * to a copy obtained from dupStringObject(); otherwise the node is left
 * untouched. The list must not be empty. Returns the object stored in the
 * tail node after the call. */
robj *dupLastObjectIfNeeded(dlist *reply) {
    dlistNode *tail_node;
    robj *tail_obj;

    ASSERT(dlistLength(reply) > 0);

    tail_node = dlistLast(reply);
    tail_obj = dlistNodeValue(tail_node);
    if (!tail_obj->constant) {
        return tail_obj;
    }

    /* Constant object: swap in a private copy. */
    tail_obj = dupStringObject(tail_obj);
    dlistNodeValue(tail_node) = tail_obj;
    return tail_obj;
}

/* -----------------------------------------------------------------------------
 * Low level functions to add more data to output buffers.
 * -------------------------------------------------------------------------- */

/* Try to copy 'len' bytes from 's' into the client's static buffer.
 *
 * Returns VR_OK when the bytes were copied, and also (without copying)
 * when the client is flagged CLIENT_CLOSE_AFTER_REPLY. Returns VR_ERROR
 * when the reply list is already in use or the static buffer has not
 * enough room left; the caller is then expected to use the reply list. */
int _addReplyToBuffer(client *c, const char *s, size_t len) {
    size_t room = sizeof(c->buf)-c->bufpos;

    /* Client is about to be closed: silently drop the data. */
    if (c->flags & CLIENT_CLOSE_AFTER_REPLY) {
        return VR_OK;
    }

    /* Once the list holds entries the static buffer cannot be extended,
     * and the string must fit in what is left of the buffer. */
    if (dlistLength(c->reply) > 0 || len > room) {
        return VR_ERROR;
    }

    memcpy(c->buf+c->bufpos,s,len);
    c->bufpos += len;
    return VR_OK;
}

/* Queue the string object 'o' on the client's reply list.
 *
 * When the tail of the list is a RAW string with a non-NULL payload and
 * the combined length stays within PROTO_REPLY_CHUNK_BYTES, the payload of
 * 'o' is appended to the tail. Otherwise a new node is added: 'o' itself
 * when it is flagged constant, a copy from dupStringObject() if not.
 * reply_bytes is kept in sync and the output buffer limit is checked at
 * the end. Nothing happens for clients flagged CLIENT_CLOSE_AFTER_REPLY. */
void _addReplyObjectToList(client *c, robj *o) {
    robj *last = NULL, *entry;
    int glue = 0;

    if (c->flags & CLIENT_CLOSE_AFTER_REPLY) return;

    if (dlistLength(c->reply) != 0) {
        last = dlistNodeValue(dlistLast(c->reply));
        glue = (last->ptr != NULL &&
                last->encoding == OBJ_ENCODING_RAW &&
                sdslen(last->ptr)+sdslen(o->ptr) <= PROTO_REPLY_CHUNK_BYTES);
    }

    if (glue) {
        /* Append to the tail object, making it private first if needed. */
        c->reply_bytes -= sdsZmallocSize(last->ptr);
        last = dupLastObjectIfNeeded(c->reply);
        last->ptr = sdscatlen(last->ptr,o->ptr,sdslen(o->ptr));
        c->reply_bytes += sdsZmallocSize(last->ptr);
    } else {
        /* Empty list or tail not suitable: add a new node. */
        if (o->constant) {
            entry = o;
        } else {
            entry = dupStringObject(o);
        }
        dlistAddNodeTail(c->reply,entry);
        c->reply_bytes += getStringObjectSdsUsedMemory(entry);
    }

    asyncCloseClientOnOutputBufferLimitReached(c);
}

/* Queue the sds 's' on the client's reply list, taking ownership of it.
 *
 * The string is either freed here (client flagged CLIENT_CLOSE_AFTER_REPLY,
 * or content appended to the tail object) or wrapped into a new string
 * object that is added to the list. */
void _addReplySdsToList(client *c, sds s) {
    robj *last = NULL;
    int glue = 0;

    if (c->flags & CLIENT_CLOSE_AFTER_REPLY) {
        sdsfree(s);
        return;
    }

    if (dlistLength(c->reply) != 0) {
        last = dlistNodeValue(dlistLast(c->reply));
        glue = (last->ptr != NULL && last->encoding == OBJ_ENCODING_RAW &&
                sdslen(last->ptr)+sdslen(s) <= PROTO_REPLY_CHUNK_BYTES);
    }

    if (!glue) {
        /* New node: the sds ends up inside the created object. */
        dlistAddNodeTail(c->reply,createObject(OBJ_STRING,s));
        c->reply_bytes += sdsZmallocSize(s);
    } else {
        /* Append to the tail object, then drop our copy of the data. */
        c->reply_bytes -= sdsZmallocSize(last->ptr);
        last = dupLastObjectIfNeeded(c->reply);
        last->ptr = sdscatlen(last->ptr,s,sdslen(s));
        c->reply_bytes += sdsZmallocSize(last->ptr);
        sdsfree(s);
    }

    asyncCloseClientOnOutputBufferLimitReached(c);
}

/* Queue 'len' bytes starting at 's' on the client's reply list.
 *
 * The bytes are appended to the tail object when it is a RAW string with
 * a non-NULL payload and the result stays within PROTO_REPLY_CHUNK_BYTES;
 * otherwise a new string object is created and added as a new node.
 * Nothing happens for clients flagged CLIENT_CLOSE_AFTER_REPLY. */
void _addReplyStringToList(client *c, const char *s, size_t len) {
    robj *last = NULL;
    int glue = 0;

    if (c->flags & CLIENT_CLOSE_AFTER_REPLY) return;

    if (dlistLength(c->reply) != 0) {
        last = dlistNodeValue(dlistLast(c->reply));
        glue = (last->ptr != NULL && last->encoding == OBJ_ENCODING_RAW &&
                sdslen(last->ptr)+len <= PROTO_REPLY_CHUNK_BYTES);
    }

    if (glue) {
        c->reply_bytes -= sdsZmallocSize(last->ptr);
        last = dupLastObjectIfNeeded(c->reply);
        last->ptr = sdscatlen(last->ptr,s,len);
        c->reply_bytes += sdsZmallocSize(last->ptr);
    } else {
        robj *fresh = createStringObject(s,len);

        dlistAddNodeTail(c->reply,fresh);
        c->reply_bytes += getStringObjectSdsUsedMemory(fresh);
    }

    asyncCloseClientOnOutputBufferLimitReached(c);
}

/* -----------------------------------------------------------------------------
 * Higher level functions to queue data on the client output buffer.
 * The following functions are the ones that command implementations call.
 * -------------------------------------------------------------------------- */

/* Queue the string object 'obj' as reply data for client 'c'.
 *
 * sds encoded objects are copied into the static buffer when possible and
 * fall back to the reply list otherwise. Integer encoded objects are
 * formatted on the stack when the static buffer has at least 32 bytes
 * free and the reply list is empty; otherwise they are decoded with
 * getDecodedObject() and queued like any other string. Any other
 * encoding triggers serverPanic(). */
void addReply(client *c, robj *obj) {
    robj *decoded;

    if (prepareClientToWrite(c) != VR_OK) return;

    /* String payload: try the static buffer first so that the object
     * itself does not need to be touched. */
    if (sdsEncodedObject(obj)) {
        if (_addReplyToBuffer(c,obj->ptr,sdslen(obj->ptr)) != VR_OK)
            _addReplyObjectToList(c,obj);
        return;
    }

    if (obj->encoding != OBJ_ENCODING_INT) {
        serverPanic("Wrong obj->encoding in addReply()");
        return;
    }

    /* Fast path: 32 bytes are more than a 64 bit integer needs as a
     * string, so format it directly when that much room is available. */
    if (dlistLength(c->reply) == 0 && (sizeof(c->buf) - c->bufpos) >= 32) {
        char digits[32];
        int ndigits;

        ndigits = ll2string(digits,sizeof(digits),(long)obj->ptr);
        if (_addReplyToBuffer(c,digits,ndigits) == VR_OK)
            return;
        /* Not expected to happen since room was verified; fall through
         * to the generic path anyway. */
    }

    decoded = getDecodedObject(obj);
    if (_addReplyToBuffer(c,decoded->ptr,sdslen(decoded->ptr)) != VR_OK)
        _addReplyObjectToList(c,decoded);
    if (decoded != obj) freeObject(decoded);
}

/* Queue the sds 's' as reply data, taking ownership of it: the string is
 * always either freed here or handed over to the reply list. */
void addReplySds(client *c, sds s) {
    if (prepareClientToWrite(c) == VR_OK &&
        _addReplyToBuffer(c,s,sdslen(s)) != VR_OK)
    {
        /* The list helper frees the sds when it is no longer needed. */
        _addReplySdsToList(c,s);
        return;
    }

    /* Either the client takes no replies or the bytes were copied into
     * the static buffer: in both cases the caller expects a free. */
    sdsfree(s);
}

/* Queue 'len' raw bytes from 's' as reply data: static buffer first,
 * reply list as fallback. */
void addReplyString(client *c, const char *s, size_t len) {
    if (prepareClientToWrite(c) != VR_OK) {
        return;
    }
    if (_addReplyToBuffer(c,s,len) == VR_OK) {
        return;
    }
    _addReplyStringToList(c,s,len);
}

void addReplyErrorLength(client *c, const char *s, size_t len) {
    addReplyString(c,"-ERR ",5);
    addReplyString(c,s,len);
    addReplyString(c,"\r\n",2);
}

/* Emit an error reply from the nul terminated string 'err'. */
void addReplyError(client *c, const char *err) {
    size_t errlen = strlen(err);

    addReplyErrorLength(c,err,errlen);
}

/* Emit an error reply built from a printf-style format string.
 * Carriage returns and newlines in the formatted message are replaced
 * with spaces so that the reply stays a single protocol line. */
void addReplyErrorFormat(client *c, const char *fmt, ...) {
    va_list args;
    sds msg;
    char *p, *end;

    va_start(args,fmt);
    msg = sdscatvprintf(sdsempty(),fmt,args);
    va_end(args);

    end = msg+sdslen(msg);
    for (p = msg; p != end; p++) {
        if (*p == '\r' || *p == '\n') *p = ' ';
    }

    addReplyErrorLength(c,msg,sdslen(msg));
    sdsfree(msg);
}

/* Emit a status reply: "+", then 'len' bytes of 's', then CRLF. */
void addReplyStatusLength(client *c, const char *s, size_t len) {
    static const char prefix[] = "+";
    static const char eol[] = "\r\n";

    addReplyString(c,prefix,sizeof(prefix)-1);
    addReplyString(c,s,len);
    addReplyString(c,eol,sizeof(eol)-1);
}

/* Emit a status reply from the nul terminated string 'status'. */
void addReplyStatus(client *c, const char *status) {
    size_t statuslen = strlen(status);

    addReplyStatusLength(c,status,statuslen);
}

/* Emit a status reply built from a printf-style format string. The
 * formatted message is sent as is. */
void addReplyStatusFormat(client *c, const char *fmt, ...) {
    va_list args;
    sds msg;

    va_start(args,fmt);
    msg = sdscatvprintf(sdsempty(),fmt,args);
    va_end(args);

    addReplyStatusLength(c,msg,sdslen(msg));
    sdsfree(msg);
}

/* Reserve a slot in the reply list for a multi bulk length that is not
 * known yet. A string object with a NULL payload is appended to the list
 * and the list node holding it is returned, to be passed later to
 * setDeferredMultiBulkLength(). Returns NULL when the client must not
 * receive replies. */
void *addDeferredMultiBulkLength(client *c) {
    robj *placeholder;

    /* The client is scheduled for writing even though the placeholder
     * cannot be sent yet: the length is expected to be filled in before
     * control returns to the event loop. */
    if (prepareClientToWrite(c) != VR_OK) {
        return NULL;
    }

    placeholder = createObject(OBJ_STRING,NULL);
    dlistAddNodeTail(c->reply,placeholder);
    return dlistLast(c->reply);
}

/* Fill in a placeholder created by addDeferredMultiBulkLength().
 *
 * 'node' is the list node returned by that function (NULL is accepted and
 * ignored). The placeholder payload becomes "*<length>\r\n"; when the next
 * node of the list has a non-NULL payload, that payload is appended to the
 * placeholder and the next node is removed. reply_bytes is updated and the
 * output buffer limit is checked before returning. */
void setDeferredMultiBulkLength(client *c, void *node, long length) {
    dlistNode *hdr_node, *next_node;
    robj *hdr, *follow;

    /* addDeferredMultiBulkLength() returned NULL: nothing was reserved. */
    if (node == NULL) return;

    hdr_node = (dlistNode*)node;
    hdr = dlistNodeValue(hdr_node);
    hdr->ptr = sdscatprintf(sdsempty(),"*%ld\r\n",length);
    hdr->encoding = OBJ_ENCODING_RAW; /* in case it was an EMBSTR. */
    c->reply_bytes += sdsZmallocSize(hdr->ptr);

    next_node = hdr_node->next;
    if (next_node != NULL) {
        follow = dlistNodeValue(next_node);

        /* Glue only when the following node carries data. */
        if (follow->ptr != NULL) {
            c->reply_bytes -= sdsZmallocSize(hdr->ptr);
            c->reply_bytes -= getStringObjectSdsUsedMemory(follow);
            hdr->ptr = sdscatlen(hdr->ptr,follow->ptr,sdslen(follow->ptr));
            c->reply_bytes += sdsZmallocSize(hdr->ptr);
            dlistDelNode(c->reply,next_node);
        }
    }

    asyncCloseClientOnOutputBufferLimitReached(c);
}

/* Add a double as a bulk reply. Infinities are sent as the literal
 * strings "inf" / "-inf"; every other value is formatted with "%.17g". */
void addReplyDouble(client *c, double d) {
    char digits[128], reply[128];
    int ndigits, nreply;

    if (isinf(d)) {
        /* Some libc implementations format infinity differently, so it
         * is spelled out explicitly. */
        const char *text = d > 0 ? "inf" : "-inf";

        addReplyBulkCString(c, text);
        return;
    }

    ndigits = snprintf(digits,sizeof(digits),"%.17g",d);
    nreply = snprintf(reply,sizeof(reply),"$%d\r\n%s\r\n",ndigits,digits);
    addReplyString(c,reply,nreply);
}

/* Add a long double as a bulk reply, using the string produced by
 * createStringObjectFromLongDouble(d,1) (the human readable formatting)
 * rather than a raw dump of the value. */
void addReplyHumanLongDouble(client *c, long double d) {
    robj *text;

    text = createStringObjectFromLongDouble(d,1);
    addReplyBulk(c,text);
    decrRefCount(text);
}

/* Emit <prefix><long long><crlf>: used for integer replies, bulk lengths
 * and multi bulk counts.
 *
 * For the '*' and '$' prefixes, values in [0, OBJ_SHARED_BULKHDR_LEN) are
 * served from the pre-built shared header objects. */
void addReplyLongLongWithPrefix(client *c, long long ll, char prefix) {
    char line[128];
    int ndigits;
    int has_shared = (ll < OBJ_SHARED_BULKHDR_LEN && ll >= 0);

    /* Headers like $3\r\n or *2\r\n are emitted very often, so small
     * values reuse shared objects. */
    if (has_shared && prefix == '*') {
        addReply(c,shared.mbulkhdr[ll]);
        return;
    }
    if (has_shared && prefix == '$') {
        addReply(c,shared.bulkhdr[ll]);
        return;
    }

    line[0] = prefix;
    ndigits = ll2string(line+1,sizeof(line)-1,ll);
    line[ndigits+1] = '\r';
    line[ndigits+2] = '\n';
    addReplyString(c,line,ndigits+3);
}

/* Add an integer reply. 0 and 1 use the shared czero / cone objects,
 * every other value is formatted with the ':' prefix. */
void addReplyLongLong(client *c, long long ll) {
    switch (ll) {
    case 0:
        addReply(c,shared.czero);
        break;
    case 1:
        addReply(c,shared.cone);
        break;
    default:
        addReplyLongLongWithPrefix(c,ll,':');
        break;
    }
}

/* Emit a multi bulk count header ("*<length>\r\n").
 *
 * Counts in [0, OBJ_SHARED_BULKHDR_LEN) are served from the shared
 * pre-built headers. Any other value, including negative ones, is
 * formatted by addReplyLongLongWithPrefix(): a negative length must never
 * be used as an index into shared.mbulkhdr[]. */
void addReplyMultiBulkLen(client *c, long length) {
    if (length >= 0 && length < OBJ_SHARED_BULKHDR_LEN)
        addReply(c,shared.mbulkhdr[length]);
    else
        addReplyLongLongWithPrefix(c,length,'*');
}

/* Emit the length prefix of a bulk reply for 'obj', example: $2234
 *
 * For sds encoded objects the length is the sds length. For any other
 * encoding the payload pointer is read as a long and the length is the
 * number of characters of its base 10 representation, sign included. */
void addReplyBulkLen(client *c, robj *obj) {
    size_t len;

    if (sdsEncodedObject(obj)) {
        len = sdslen(obj->ptr);
    } else {
        long n = (long)obj->ptr;
        unsigned long magnitude;

        /* Count the digits on the unsigned magnitude: negating a long is
         * undefined behavior for LONG_MIN, while unsigned arithmetic wraps
         * to the right value. */
        len = 1;
        if (n < 0) {
            len++; /* room for the minus sign */
            magnitude = 0UL - (unsigned long)n;
        } else {
            magnitude = (unsigned long)n;
        }
        while ((magnitude /= 10) != 0) {
            len++;
        }
    }

    if (len < OBJ_SHARED_BULKHDR_LEN)
        addReply(c,shared.bulkhdr[len]);
    else
        addReplyLongLongWithPrefix(c,len,'$');
}

/* Add a string object as a bulk reply: length header, payload, CRLF. */
void addReplyBulk(client *c, robj *obj) {
    /* "$<len>\r\n" */
    addReplyBulkLen(c,obj);

    /* payload followed by the terminator */
    addReply(c,obj);
    addReply(c,shared.crlf);
}

/* Add 'len' bytes starting at 'p' as a bulk reply: length header,
 * payload, CRLF. */
void addReplyBulkCBuffer(client *c, const void *p, size_t len) {
    /* "$<len>\r\n" */
    addReplyLongLongWithPrefix(c,len,'$');

    /* payload followed by the terminator */
    addReplyString(c,p,len);
    addReply(c,shared.crlf);
}

/* Add the sds 's' as a bulk reply: length header, payload, CRLF.
 * Takes ownership of 's': it is handed to addReplySds(), which frees it
 * or stores it in the reply list. */
void addReplyBulkSds(client *c, sds s)  {
    /* sdscatfmt() reads an unsigned int for "%u"; the sds length is wider
     * than that on LP64 platforms, so use the 64 bit "%U" specifier with a
     * matching unsigned long long argument. */
    addReplySds(c,sdscatfmt(sdsempty(),"$%U\r\n",
        (unsigned long long)sdslen(s)));
    addReplySds(c,s);
    addReply(c,shared.crlf);
}

/* Add a nul terminated C string as a bulk reply. A NULL pointer is sent
 * as the shared null bulk reply. */
void addReplyBulkCString(client *c, const char *s) {
    if (s == NULL) {
        addReply(c,shared.nullbulk);
        return;
    }
    addReplyBulkCBuffer(c,s,strlen(s));
}

/* Add a long long as a bulk reply, i.e. its decimal string form sent as
 * a bulk string. */
void addReplyBulkLongLong(client *c, long long ll) {
    char digits[64];
    int ndigits = ll2string(digits,sizeof(digits),ll);

    addReplyBulkCBuffer(c,digits,ndigits);
}

/* Replace the output buffers of 'dst' with a copy of those of 'src'.
 * The previous reply list of 'dst' is released; the reply list, the used
 * part of the static buffer, bufpos and reply_bytes are then copied. */
void copyClientOutputBuffer(client *dst, client *src) {
    dlist *copy;

    /* Reply list: drop the old one, install a duplicate of the source. */
    dlistRelease(dst->reply);
    copy = dlistDup(src->reply);
    dst->reply = copy;

    /* Static buffer: only the bytes in use need to be copied. */
    memcpy(dst->buf,src->buf,src->bufpos);
    dst->bufpos = src->bufpos;

    dst->reply_bytes = src->reply_bytes;
}

/* Return 1 when the client still has reply data to write to the socket,
 * either in the static buffer or in the reply list, 0 otherwise. */
int clientHasPendingReplies(client *c) {
    if (c->bufpos) {
        return 1;
    }
    return dlistLength(c->reply) != 0;
}

/* Free every argument object of the current command and reset argc and
 * cmd. The argv array itself is left allocated. */
static void freeClientArgv(client *c) {
    int idx = 0;

    while (idx < c->argc) {
        freeObject(c->argv[idx]);
        idx++;
    }
    c->argc = 0;
    c->cmd = NULL;
}

/* Close all the slave connections. This is useful in chained replication
 * when we resync with our own master and want to force all our slaves to
 * resync with us as well.
 *
 * The loop repeatedly frees the client at the head of repl.slaves until
 * the list is empty, so it relies on freeClient() removing the client
 * from that list. */
void disconnectSlaves(void) {
    dlistNode *head;

    while (dlistLength(repl.slaves) != 0) {
        head = dlistFirst(repl.slaves);
        freeClient((client*)head->value);
    }
}

/* Detach a client from the event loop it currently belongs to, without
 * touching the Pub/Sub channels and without closing the connection.
 * Used when a client jumps between workers.
 *
 * c->vel is always cleared. When c->steps >= 1 nothing else is done;
 * otherwise the client is removed from the loop's current_client slot,
 * client list, file events, pending-write list and unblocked list. */
void unlinkClientFromEventloop(client *c) {
    dlistNode *node;
    vr_eventloop *owner = c->vel;

    c->vel = NULL;

    if (c->steps >= 1) {
        return;
    }

    /* If this is marked as current client unset it. */
    if (owner->current_client == c) {
        owner->current_client = NULL;
    }

    /* Only clients with an active socket are registered in the client
     * list and in the event loop: fake or already unlinked clients have
     * the descriptor set to -1. */
    if (c->conn->sd != -1) {
        /* Remove from the list of active clients. */
        node = dlistSearchKey(owner->clients,c);
        ASSERT(node != NULL);
        dlistDelNode(owner->clients,node);

        /* Unregister the async I/O handlers; the socket stays open. */
        aeDeleteFileEvent(owner->el,c->conn->sd,AE_READABLE);
        aeDeleteFileEvent(owner->el,c->conn->sd,AE_WRITABLE);
    }

    /* Remove from the list of pending writes if needed. */
    if (c->flags & CLIENT_PENDING_WRITE) {
        node = dlistSearchKey(owner->clients_pending_write,c);
        ASSERT(node != NULL);
        dlistDelNode(owner->clients_pending_write,node);
        c->flags &= ~CLIENT_PENDING_WRITE;
    }

    /* A client that was just unblocked sits in the unblocked list. */
    if (c->flags & CLIENT_UNBLOCKED) {
        node = dlistSearchKey(owner->unblocked_clients,c);
        ASSERT(node != NULL);
        dlistDelNode(owner->unblocked_clients,node);
        c->flags &= ~CLIENT_UNBLOCKED;
    }
}

/* Attach client 'c' to the event loop 'vel'.
 *
 * The client is pushed on the loop's client list and a read handler is
 * registered for its socket; on failure the client is freed. Any data
 * left in the query buffer is then processed. Afterwards a client flagged
 * CLIENT_JUMP is dispatched to worker c->taridx, while any other client
 * that has replies pending and is not in the pending-write list gets a
 * write handler installed (and is scheduled for async free if that
 * fails). */
void linkClientToEventloop(client *c,vr_eventloop *vel) {
    dlistPush(vel->clients,c);
    c->vel = vel;

    if (aeCreateFileEvent(vel->el,c->conn->sd,AE_READABLE,
        readQueryFromClient,c) == AE_ERR)
    {
        freeClient(c);
        return;
    }

    /* Handle what remains in the query buffer. */
    processInputBuffer(c);

    if (c->flags&CLIENT_JUMP) {
        dispatch_conn_exist(c,c->taridx);
        return;
    }

    /* Nothing to send, or a flush is already scheduled. */
    if (!clientHasPendingReplies(c)) return;
    if (c->flags&CLIENT_PENDING_WRITE) return;

    if (aeCreateFileEvent(vel->el, c->conn->sd, AE_WRITABLE,
        sendReplyToClient, c) == AE_ERR)
    {
        freeClientAsync(c);
    }
}

/* Remove the client from the lists of its event loop where it could be
 * referenced, not including the Pub/Sub channels, and give its connection
 * back with conn_put(). Used by freeClient() and replicationCacheMaster().
 *
 * After the call c->conn is NULL if the client had an active socket. */
void unlinkClient(client *c) {
    dlistNode *node;
    vr_eventloop *vel = c->vel;

    /* If this is marked as current client unset it. */
    if (vel->current_client == c) {
        vel->current_client = NULL;
    }

    /* Only clients with an active socket are registered in the client
     * list and in the event loop: fake or already unlinked clients have
     * the descriptor set to -1. */
    if (c->conn->sd != -1) {
        /* Remove from the list of active clients. */
        node = dlistSearchKey(vel->clients,c);
        ASSERT(node != NULL);
        dlistDelNode(vel->clients,node);

        /* Unregister async I/O handlers and release the connection. */
        aeDeleteFileEvent(vel->el,c->conn->sd,AE_READABLE);
        aeDeleteFileEvent(vel->el,c->conn->sd,AE_WRITABLE);
        conn_put(c->conn);
        c->conn = NULL;
    }

    /* Remove from the list of pending writes if needed. */
    if (c->flags & CLIENT_PENDING_WRITE) {
        node = dlistSearchKey(vel->clients_pending_write,c);
        ASSERT(node != NULL);
        dlistDelNode(vel->clients_pending_write,node);
        c->flags &= ~CLIENT_PENDING_WRITE;
    }

    /* A client that was just unblocked sits in the unblocked list. */
    if (c->flags & CLIENT_UNBLOCKED) {
        node = dlistSearchKey(vel->unblocked_clients,c);
        ASSERT(node != NULL);
        dlistDelNode(vel->unblocked_clients,node);
        c->flags &= ~CLIENT_UNBLOCKED;
    }
}

/* Tear down a client: release its buffers and per-client structures,
 * unlink it from the event loop and replication lists, and free the
 * client structure itself.
 *
 * Exception: when repl.role is REPLICATION_ROLE_MASTER and the client is
 * flagged CLIENT_MASTER without any of the CLOSE_AFTER_REPLY, CLOSE_ASAP,
 * BLOCKED or UNBLOCKED flags, the client is handed to
 * replicationCacheMaster() and this function returns without freeing it.
 *
 * After a normal return 'c' is no longer valid. */
void freeClient(client *c) {
    dlistNode *ln;

    /* If it is our master that's being disconnected we should make sure
     * to cache the state to try a partial resynchronization later.
     *
     * Note that before doing this we make sure that the client is not in
     * some unexpected state, by checking its flags. */
    if (repl.role == REPLICATION_ROLE_MASTER && c->flags & CLIENT_MASTER) {
        log_warn("connection with master lost.");
        if (!(c->flags & (CLIENT_CLOSE_AFTER_REPLY|
                          CLIENT_CLOSE_ASAP|
                          CLIENT_BLOCKED|
                          CLIENT_UNBLOCKED)))
        {
            replicationCacheMaster(c);
            return;
        }
    }

    /* Log link disconnection with slave */
    if ((c->flags & CLIENT_SLAVE) && !(c->flags & CLIENT_MONITOR)) {
        log_warn("connection with slave %s lost.",
            replicationGetSlaveName(c));
    }

    /* Free the query buffer */
    sdsfree(c->querybuf);
    c->querybuf = NULL;

    /* Deallocate structures used to block on blocking ops. */
    if (c->flags & CLIENT_BLOCKED) unblockClient(c);
    dictRelease(c->bpop.keys);

    /* UNWATCH all the keys */
    unwatchAllKeys(c);
    dlistRelease(c->watched_keys);

    /* Unsubscribe from all the pubsub channels */
    pubsubUnsubscribeAllChannels(c,0);
    pubsubUnsubscribeAllPatterns(c,0);
    dictRelease(c->pubsub_channels);
    dlistRelease(c->pubsub_patterns);

    /* Free data structures. */
    dlistRelease(c->reply);
    freeClientArgv(c);

    /* Unlink the client: this will close the socket, remove the I/O
     * handlers, and remove references of the client from different
     * places where active clients may be referenced.
     *
     * unlinkClient() sets c->conn to NULL for clients with an active
     * socket, so c->conn must not be dereferenced past this point. */
    unlinkClient(c);

    /* Master/slave cleanup Case 1:
     * we lost the connection with a slave. */
    if (c->flags & CLIENT_SLAVE) {
        /* A bulk transfer in progress owns a file descriptor and possibly
         * a preamble string. */
        if (c->replstate == SLAVE_STATE_SEND_BULK) {
            if (c->repldbfd != -1) close(c->repldbfd);
            if (c->replpreamble) sdsfree(c->replpreamble);
        }
        /* Clients flagged CLIENT_MONITOR are looked up in the monitors
         * list, all the others in the slaves list. */
        dlist *l = (c->flags & CLIENT_MONITOR) ? server.monitors : repl.slaves;
        ln = dlistSearchKey(l,c);
        ASSERT(ln != NULL);
        dlistDelNode(l,ln);
        /* We need to remember the time when we started to have zero
         * attached slaves, as after some time we'll free the replication
         * backlog. */
        if (c->flags & CLIENT_SLAVE && dlistLength(repl.slaves) == 0)
            repl.repl_no_slaves_since = c->vel->unixtime;
        refreshGoodSlavesCount();
    }

    /* Master/slave cleanup Case 2:
     * we lost the connection with the master. */
    if (c->flags & CLIENT_MASTER) replicationHandleMasterDisconnection();

    /* If this client was scheduled for async freeing we need to remove it
     * from the queue. */
    if (c->flags & CLIENT_CLOSE_ASAP) {
        ln = dlistSearchKey(c->vel->clients_to_close,c);
        ASSERT(ln != NULL);
        dlistDelNode(c->vel->clients_to_close,ln);
    }

    /* Release other dynamically allocated client structure fields,
     * and finally release the client structure itself. */
    if (c->name) freeObject(c->name);
    if (c->argv) dfree(c->argv);
    freeClientMultiState(c);
    sdsfree(c->peerid);
    dfree(c);
}

/* Schedule a client to be freed later, for contexts where calling
 * freeClient() directly is not possible because the client must stay
 * valid for the rest of the current flow.
 *
 * The client is flagged CLIENT_CLOSE_ASAP and appended to the
 * clients_to_close list of its event loop. Clients already flagged, and
 * the Lua client, are left alone. */
void freeClientAsync(client *c) {
    if (c->flags & (CLIENT_CLOSE_ASAP|CLIENT_LUA)) {
        return;
    }

    c->flags |= CLIENT_CLOSE_ASAP;
    dlistAddNodeTail(c->vel->clients_to_close,c);
}

/* Free every client queued in vel->clients_to_close.
 *
 * CLIENT_CLOSE_ASAP is cleared before calling freeClient() so that
 * freeClient() does not try to remove the queue node itself: the node is
 * deleted here right after the client has been freed. */
void freeClientsInAsyncFreeQueue(vr_eventloop *vel) {
    dlistNode *head;
    client *victim;

    while (dlistLength(vel->clients_to_close) != 0) {
        head = dlistFirst(vel->clients_to_close);
        victim = dlistNodeValue(head);

        victim->flags &= ~CLIENT_CLOSE_ASAP;
        freeClient(victim);
        dlistDelNode(vel->clients_to_close,head);
    }
}

/* Write data in output buffers to client. Return VR_OK if the client
 * is still valid after the call, VR_ERROR if it was freed.
 *
 * fd                - descriptor the data is written to.
 * c                 - client whose static buffer and reply list are drained.
 * handler_installed - non-zero when a writable file event is registered
 *                     for the client; it is removed once nothing is left
 *                     to send.
 *
 * The static buffer is drained first, then the reply list one object at a
 * time; c->sentlen tracks how much of the current buffer/object has
 * already been written. */
int writeToClient(int fd, client *c, int handler_installed) {
    ssize_t nwritten = 0, totwritten = 0;
    size_t objlen;
    size_t objmem;
    robj *o;
    long long maxmemory;

    maxmemory = c->vel->cc.maxmemory;
    while(clientHasPendingReplies(c)) {
        if (c->bufpos > 0) {
            /* NOTE(review): vr_write is assumed to follow write(2)
             * conventions (-1 with errno set on failure) - confirm. */
            nwritten = vr_write(fd,c->buf+c->sentlen,c->bufpos-c->sentlen);
            if (nwritten <= 0) break;
            c->sentlen += nwritten;
            totwritten += nwritten;

            /* If the buffer was sent, set bufpos to zero to continue with
             * the remainder of the reply. */
            if ((int)c->sentlen == c->bufpos) {
                c->bufpos = 0;
                c->sentlen = 0;
            }
        } else {
            o = dlistNodeValue(dlistFirst(c->reply));
            objlen = sdslen(o->ptr);
            objmem = getStringObjectSdsUsedMemory(o);

            /* Empty objects carry nothing to send: just drop the node. */
            if (objlen == 0) {
                dlistDelNode(c->reply,dlistFirst(c->reply));
                c->reply_bytes -= objmem;
                continue;
            }

            nwritten = vr_write(fd, ((char*)o->ptr)+c->sentlen,objlen-c->sentlen);
            if (nwritten <= 0) break;
            c->sentlen += nwritten;
            totwritten += nwritten;

            /* If we fully sent the object on head go to the next one */
            if (c->sentlen == objlen) {
                dlistDelNode(c->reply,dlistFirst(c->reply));
                c->sentlen = 0;
                c->reply_bytes -= objmem;
            }
        }
        /* Note that we avoid to send more than NET_MAX_WRITES_PER_EVENT
         * bytes, in a single threaded server it's a good idea to serve
         * other clients as well, even if a very large request comes from
         * super fast link that is always able to accept data (in real world
         * scenario think about 'KEYS *' against the loopback interface).
         *
         * However if we are over the maxmemory limit we ignore that and
         * just deliver as much data as it is possible to deliver. */
        if (totwritten > NET_MAX_WRITES_PER_EVENT &&
            (maxmemory == 0 || dalloc_used_memory() < maxmemory)) 
            break;
    }
    /* A failed write is fatal for the client unless it is EAGAIN, in which
     * case the remaining data simply stays queued. */
    if (nwritten == -1) {
        if (errno == EAGAIN) {
            nwritten = 0;
        } else {
            log_debug(LOG_VERB,
                "error writing to client: %s", strerror(errno));
            freeClient(c);
            return VR_ERROR;
        }
    }
    if (totwritten > 0) {
        update_stats_add(c->vel->stats, net_output_bytes, (long long)totwritten);
        /* For clients representing masters we don't count sending data
         * as an interaction, since we always send REPLCONF ACK commands
         * that take some time to just fill the socket output buffer.
         * We just rely on data / pings received for timeout detection. */
        if (!(c->flags & CLIENT_MASTER)) c->lastinteraction = c->vel->unixtime;
    }
    /* Everything was sent: reset the cursor and stop listening for
     * writable events if a handler was installed. */
    if (!clientHasPendingReplies(c)) {
        c->sentlen = 0;
        if (handler_installed) aeDeleteFileEvent(c->vel->el,c->conn->sd,AE_WRITABLE);

        /* Close connection after entire reply has been sent. */
        if (c->flags & CLIENT_CLOSE_AFTER_REPLY) {
            freeClient(c);
            return VR_ERROR;
        }
    }
    return VR_OK;
}

/* Writable event handler: 'privdata' is the client whose output buffers
 * are flushed to 'fd'. The event loop and the mask are not used. */
void sendReplyToClient(aeEventLoop *el, int fd, void *privdata, int mask) {
    client *c = privdata;

    UNUSED(el);
    UNUSED(mask);
    writeToClient(fd,c,1);
}

/* Flush the clients queued in vel->clients_pending_write.
 *
 * Called just before entering the event loop, in the hope that replies
 * can be written straight to the sockets without having to install a
 * writable event handler first. Each client is unflagged and removed from
 * the list, then written to; only clients that still have data pending
 * afterwards get the write handler installed.
 *
 * Returns the number of clients that were in the list on entry. */
int handleClientsWithPendingWrites(vr_eventloop *vel) {
    dlistIter iter;
    dlistNode *node;
    int pending = dlistLength(vel->clients_pending_write);

    dlistRewind(vel->clients_pending_write,&iter);
    for (node = dlistNext(&iter); node != NULL; node = dlistNext(&iter)) {
        client *c = dlistNodeValue(node);

        c->flags &= ~CLIENT_PENDING_WRITE;
        dlistDelNode(vel->clients_pending_write,node);

        /* Try to write buffers to the client socket; on VR_ERROR the
         * client is gone and must not be touched. */
        if (writeToClient(c->conn->sd,c,0) == VR_ERROR) continue;

        /* Everything went out: no handler needed. */
        if (!clientHasPendingReplies(c)) continue;

        if (aeCreateFileEvent(vel->el, c->conn->sd, AE_WRITABLE,
                sendReplyToClient, c) == AE_ERR)
        {
            freeClientAsync(c);
        }
    }
    return pending;
}

/* Prepare the client to process the next command.
 *
 * Clients flagged CLIENT_JUMP are left untouched. For every other client
 * the current arguments are freed, the request parsing state (reqtype,
 * multibulklen, bulklen) is reset, and the CLIENT REPLY SKIP flags are
 * rotated. */
void resetClient(client *c) {
    if (c->flags&CLIENT_JUMP)
        return;

    freeClientArgv(c);
    c->reqtype = 0;
    c->multibulklen = 0;
    c->bulklen = -1;

    /* Remove the CLIENT_REPLY_SKIP flag if any so that the reply
     * to the next command will be sent, but set the flag if the command
     * we just processed was "CLIENT REPLY SKIP". */
    c->flags &= ~CLIENT_REPLY_SKIP;
    if (c->flags & CLIENT_REPLY_SKIP_NEXT) {
        c->flags |= CLIENT_REPLY_SKIP;
        c->flags &= ~CLIENT_REPLY_SKIP_NEXT;
    }
}

/* Parse one inline (non multi bulk) request out of the query buffer.
 *
 * Returns VR_OK when a complete line was consumed: c->argc / c->argv then
 * hold the non-empty arguments of the line (possibly none) and the line,
 * together with its terminator, has been removed from the query buffer.
 *
 * Returns VR_ERROR when no complete line is available yet, or when a
 * protocol error was detected (line too long, unbalanced quotes); in the
 * latter case an error reply is queued and the client is flagged via
 * setProtocolError(). */
int processInlineBuffer(client *c) {
    char *newline;
    int argc, j;
    int linefeed_chars = 1; /* length of the line terminator: "\n" or "\r\n" */
    sds *argv, aux;
    size_t querylen;

    /* Search for end of line */
    newline = strchr(c->querybuf,'\n');

    /* Nothing to do without a newline */
    if (newline == NULL) {
        if (sdslen(c->querybuf) > PROTO_INLINE_MAX_SIZE) {
            addReplyError(c,"Protocol error: too big inline request");
            setProtocolError(c,0);
        }
        return VR_ERROR;
    }

    /* Handle the \r\n case. */
    if (newline != c->querybuf && *(newline-1) == '\r') {
        newline--;
        linefeed_chars++;
    }

    /* Split the input buffer up to the line terminator */
    querylen = newline-(c->querybuf);
    aux = sdsnewlen(c->querybuf,querylen);
    argv = sdssplitargs(aux,&argc);
    sdsfree(aux);
    if (argv == NULL) {
        addReplyError(c,"Protocol error: unbalanced quotes in request");
        setProtocolError(c,0);
        return VR_ERROR;
    }

    /* Newline from slaves can be used to refresh the last ACK time.
     * This is useful for a slave to ping back while loading a big
     * RDB file. */
    if (querylen == 0 && c->flags & CLIENT_SLAVE)
        c->repl_ack_time = c->vel->unixtime;

    /* Leave data after the first line of the query in the buffer.
     * Only the terminator actually found is skipped: a line ended by a
     * bare "\n" must not swallow the first byte of the next request. */
    sdsrange(c->querybuf,querylen+linefeed_chars,-1);

    /* Setup argv array on client structure */
    if (argc) {
        if (c->argv) dfree(c->argv);
        c->argv = dalloc(sizeof(robj*)*argc);
    }

    /* Create string objects for all the non-empty arguments; each object
     * takes over the sds it wraps. */
    for (c->argc = 0, j = 0; j < argc; j++) {
        if (sdslen(argv[j])) {
            c->argv[c->argc] = createObject(OBJ_STRING,argv[j]);
            c->argc++;
        } else {
            sdsfree(argv[j]);
        }
    }
    dfree(argv);
    return VR_OK;
}

/* Helper for the request parsers: record a protocol error on client 'c'.
 *
 * The client info is logged at verbose level, the query buffer is trimmed
 * to start at offset 'pos' and the client is flagged
 * CLIENT_CLOSE_AFTER_REPLY. */
static void setProtocolError(client *c, int pos) {
    if (log_loggable(LOG_VERB)) {
        sds info = catClientInfoString(sdsempty(),c);

        log_debug(LOG_VERB,
            "Protocol error from client: %s", info);
        sdsfree(info);
    }

    sdsrange(c->querybuf,pos,-1);
    c->flags |= CLIENT_CLOSE_AFTER_REPLY;
}

/* Parse a multi bulk request ("*<count>\r\n" followed by <count> items of
 * the form "$<len>\r\n<data>\r\n") from c->querybuf into c->argv / c->argc.
 *
 * Parsing state survives across calls: c->multibulklen holds the number of
 * arguments still to read and c->bulklen the length of the bulk currently
 * being read (-1 when not yet known), so the function can simply be called
 * again once more data has been appended to the query buffer. Everything
 * that was fully parsed is trimmed from the buffer before returning.
 *
 * Returns VR_OK when the whole command is available in c->argv (or when a
 * count <= 0 was consumed, leaving c->argc at 0). Returns VR_ERROR when more
 * data is needed, or on a protocol error; in the latter case an error reply
 * is queued and setProtocolError() is called on the client. */
int processMultibulkBuffer(client *c) {
    char *newline = NULL;
    int pos = 0, ok;
    long long ll;

    if (c->multibulklen == 0) {
        /* The client should have been reset */
        serverAssertWithInfo(c,NULL,c->argc == 0);

        /* Multi bulk length cannot be read without a \r\n */
        newline = strchr(c->querybuf,'\r');
        if (newline == NULL) {
            if (sdslen(c->querybuf) > PROTO_INLINE_MAX_SIZE) {
                addReplyError(c,"Protocol error: too big mbulk count string");
                setProtocolError(c,0);
            }
            return VR_ERROR;
        }

        /* Buffer should also contain \n */
        if (newline-(c->querybuf) > ((signed)sdslen(c->querybuf)-2))
            return VR_ERROR;

        /* We know for sure there is a whole line since newline != NULL,
         * so go ahead and find out the multi bulk length. */
        serverAssertWithInfo(c,NULL,c->querybuf[0] == '*');
        ok = string2ll(c->querybuf+1,newline-(c->querybuf+1),&ll);
        if (!ok || ll > 1024*1024) {
            addReplyError(c,"Protocol error: invalid multibulk length");
            setProtocolError(c,pos);
            return VR_ERROR;
        }

        pos = (newline-c->querybuf)+2;
        if (ll <= 0) {
            /* Empty or null multi bulk: consume the header, no command. */
            sdsrange(c->querybuf,pos,-1);
            return VR_OK;
        }

        c->multibulklen = ll;

        /* Setup argv array on client structure */
        if (c->argv) dfree(c->argv);
        c->argv = dalloc(sizeof(robj*)*c->multibulklen);
    }

    serverAssertWithInfo(c,NULL,c->multibulklen > 0);
    while(c->multibulklen) {
        /* Read bulk length if unknown */
        if (c->bulklen == -1) {
            newline = strchr(c->querybuf+pos,'\r');
            if (newline == NULL) {
                /* Only the still unparsed part of the buffer (from 'pos'
                 * on) can belong to the bulk header. Measuring the whole
                 * buffer would reject a valid request whose already parsed
                 * arguments exceed the limit while its next "$<len>" header
                 * is merely split across two reads. */
                if (sdslen(c->querybuf)-pos > PROTO_INLINE_MAX_SIZE) {
                    addReplyError(c,
                        "Protocol error: too big bulk count string");
                    setProtocolError(c,0);
                    return VR_ERROR;
                }
                break;
            }

            /* Buffer should also contain \n */
            if (newline-(c->querybuf) > ((signed)sdslen(c->querybuf)-2))
                break;

            if (c->querybuf[pos] != '$') {
                addReplyErrorFormat(c,
                    "Protocol error: expected '$', got '%c'",
                    c->querybuf[pos]);
                setProtocolError(c,pos);
                return VR_ERROR;
            }

            ok = string2ll(c->querybuf+pos+1,newline-(c->querybuf+pos+1),&ll);
            if (!ok || ll < 0 || ll > 512*1024*1024) {
                addReplyError(c,"Protocol error: invalid bulk length");
                setProtocolError(c,pos);
                return VR_ERROR;
            }

            pos += newline-(c->querybuf+pos)+2;
            if (ll >= PROTO_MBULK_BIG_ARG) {
                size_t qblen;

                /* If we are going to read a large object from network
                 * try to make it likely that it will start at c->querybuf
                 * boundary so that we can optimize object creation
                 * avoiding a large copy of data. */
                sdsrange(c->querybuf,pos,-1);
                pos = 0;
                qblen = sdslen(c->querybuf);
                /* Hint the sds library about the amount of bytes this string is
                 * going to contain. */
                if (qblen < (size_t)ll+2)
                    c->querybuf = sdsMakeRoomFor(c->querybuf,ll+2-qblen);
            }
            c->bulklen = ll;
        }

        /* Read bulk argument */
        if (sdslen(c->querybuf)-pos < (unsigned)(c->bulklen+2)) {
            /* Not enough data (+2 == trailing \r\n) */
            break;
        } else {
            /* Optimization: if the buffer contains JUST our bulk element
             * instead of creating a new object by *copying* the sds we
             * just use the current sds string. */
            if (pos == 0 &&
                c->bulklen >= PROTO_MBULK_BIG_ARG &&
                (signed) sdslen(c->querybuf) == c->bulklen+2)
            {
                c->argv[c->argc++] = createObject(OBJ_STRING,c->querybuf);
                sdsIncrLen(c->querybuf,-2); /* remove CRLF */
                /* Assume that if we saw a fat argument we'll see another one
                 * likely... */
                c->querybuf = sdsnewlen(NULL,c->bulklen+2);
                sdsclear(c->querybuf);
                pos = 0;
            } else {
                c->argv[c->argc++] =
                    createStringObject(c->querybuf+pos,c->bulklen);
                pos += c->bulklen+2;
            }
            c->bulklen = -1;
            c->multibulklen--;
        }
    }

    /* Trim to pos */
    if (pos) sdsrange(c->querybuf,pos,-1);

    /* We're done when c->multibulklen == 0 */
    if (c->multibulklen == 0) return VR_OK;

    /* Still not ready to process the command */
    return VR_ERROR;
}

/* Consume the client query buffer, parsing and executing as many commands
 * as possible. The client is published as c->vel->current_client for the
 * duration of the call and the field is cleared again before returning. */
void processInputBuffer(client *c) {
    c->vel->current_client = c;

    /* Loop for as long as unparsed input is available. */
    for (;;) {
        if (sdslen(c->querybuf) == 0) break;

        /* Paused clients are not served; slaves are exempt from pauses. */
        if (!(c->flags & CLIENT_SLAVE) && clientsArePaused(c->vel)) break;

        /* Stop when the client is blocked in the middle of something, or
         * when it is going to be closed once the reply is written: in the
         * latter case no further command must make the reply grow. */
        if (c->flags & (CLIENT_BLOCKED|CLIENT_CLOSE_AFTER_REPLY)) break;

        /* Guess the request type from the first byte when still unknown. */
        if (!c->reqtype) {
            c->reqtype = (c->querybuf[0] == '*') ?
                PROTO_REQ_MULTIBULK : PROTO_REQ_INLINE;
        }

        if (c->reqtype == PROTO_REQ_INLINE) {
            if (processInlineBuffer(c) != VR_OK) break;
        } else if (c->reqtype == PROTO_REQ_MULTIBULK) {
            if (processMultibulkBuffer(c) != VR_OK) break;
        } else {
            serverPanic("Unknown request type");
        }

        /* The parsers may complete without producing any argument (for
         * instance a multi bulk count <= 0): just reset and go on. */
        if (c->argc == 0) {
            resetClient(c);
            continue;
        }

        /* The client is reset only when the command was executed. */
        if (processCommand(c) == VR_OK)
            resetClient(c);

        /* freeMemoryIfNeeded may flush slave output buffers. This may
         * result into a slave, that may be the active client, to be
         * freed. */
        if (c->vel->current_client == NULL) break;

        /* The client has to jump to another worker: stop here, the rest
         * of the query buffer is handled once the jump is finished. */
        if (c->flags&CLIENT_JUMP) break;
    }

    c->vel->current_client = NULL;
}

/* Readable-event handler of a client socket.
 *
 * Reads up to PROTO_IOBUF_LEN bytes from 'fd' into the client query buffer
 * ('privdata' is the client), updates the input statistics, enforces
 * server.client_max_querybuf_len and then runs processInputBuffer(). If the
 * processed command flagged the client with CLIENT_JUMP, the client is
 * handed over to the worker selected in c->taridx.
 *
 * The client is freed on read errors other than EAGAIN, when the peer
 * closed the connection, and when the query buffer grows over the limit. */
void readQueryFromClient(aeEventLoop *el, int fd, void *privdata, int mask) {
    client *c = (client*) privdata;
    int nread, readlen;
    size_t qblen;
    UNUSED(el);
    UNUSED(mask);

    readlen = PROTO_IOBUF_LEN;
    /* If this is a multi bulk request, and we are processing a bulk reply
     * that is large enough, try to maximize the probability that the query
     * buffer contains exactly the SDS string representing the object, even
     * at the risk of requiring more read(2) calls. This way the function
     * processMultibulkBuffer() can avoid copying buffers to create the
     * object representing the argument. */
    if (c->reqtype == PROTO_REQ_MULTIBULK && c->multibulklen && c->bulklen != -1
        && c->bulklen >= PROTO_MBULK_BIG_ARG)
    {
        int remaining = (unsigned)(c->bulklen+2)-sdslen(c->querybuf);

        /* 'remaining' is zero or negative when the query buffer already
         * holds the whole bulk, which happens when input processing was
         * suspended (paused or blocked client) while data kept arriving.
         * Using such a value as read length would either ask for a huge
         * allocation or perform a zero bytes read that is then mistaken
         * for a closed connection, so only shrink readlen when positive. */
        if (remaining > 0 && remaining < readlen) readlen = remaining;
    }

    qblen = sdslen(c->querybuf);
    if (c->querybuf_peak < qblen) c->querybuf_peak = qblen;
    c->querybuf = sdsMakeRoomFor(c->querybuf, readlen);
    nread = vr_read(fd, c->querybuf+qblen, readlen);
    if (nread == -1) {
        if (errno == EAGAIN) {
            /* No data available right now: wait for the next event. */
            return;
        } else {
            log_debug(LOG_VERB, "reading from client: %s",strerror(errno));
            freeClient(c);
            return;
        }
    } else if (nread == 0) {
        log_debug(LOG_VERB, "client closed connection");
        freeClient(c);
        return;
    }

    /* Account for the bytes just appended to the query buffer. */
    sdsIncrLen(c->querybuf,nread);
    c->lastinteraction = c->vel->unixtime;
    if (c->flags & CLIENT_MASTER) c->reploff += nread;
    update_stats_add(c->vel->stats, net_input_bytes, nread);
    if (sdslen(c->querybuf) > server.client_max_querybuf_len) {
        sds ci = catClientInfoString(sdsempty(),c), bytes = sdsempty();

        /* Log the first 64 bytes of the offending buffer, escaped. */
        bytes = sdscatrepr(bytes,c->querybuf,64);
        log_warn("closing client that reached max query buffer length: %s (qbuf initial bytes: %s)", ci, bytes);
        sdsfree(ci);
        sdsfree(bytes);
        freeClient(c);
        return;
    }
    processInputBuffer(c);

    /* The executed command asked to continue on another worker. */
    if (c->flags&CLIENT_JUMP) {
        dispatch_conn_exist(c,c->taridx);
    }
}

/* Scan the clients of event loop 'vel' and report, through the two output
 * pointers, the longest reply list (number of nodes) and the biggest query
 * buffer (bytes) found among them. Both are 0 when there are no clients. */
void getClientsMaxBuffers(vr_eventloop *vel, unsigned long *longest_output_list,
                          unsigned long *biggest_input_buffer) {
    dlistIter iter;
    dlistNode *node;
    unsigned long max_reply_nodes = 0, max_querybuf = 0;

    dlistRewind(vel->clients,&iter);
    for (node = dlistNext(&iter); node != NULL; node = dlistNext(&iter)) {
        client *cur = dlistNodeValue(node);
        size_t querybuf_len = sdslen(cur->querybuf);

        if (dlistLength(cur->reply) > max_reply_nodes)
            max_reply_nodes = dlistLength(cur->reply);
        if (querybuf_len > max_querybuf)
            max_querybuf = querybuf_len;
    }

    *biggest_input_buffer = max_querybuf;
    *longest_output_list = max_reply_nodes;
}

/* Write the "Peer ID" of 'client' into 'peerid' (at most 'peerid_len'
 * bytes).
 *
 * A Peer ID is a colon separated ip:port pair.
 * For IPv4 it's in the form x.y.z.k:port, example: "127.0.0.1:1234".
 * For IPv6 addresses [] is used around the IP part, like in "[::1]:1234".
 * For Unix sockets path:0 is used, like in "/tmp/redis:0".
 *
 * Unix socket clients are formatted here from server.unixsocket; for TCP
 * clients the formatting is delegated to vr_net_format_peer().
 * NOTE(review): the exact TCP output, including what is written when the
 * peer address cannot be resolved, depends on vr_net_format_peer() --
 * confirm there. */
void genClientPeerId(client *client, char *peerid,
                            size_t peerid_len) {
    if (!(client->flags & CLIENT_UNIX_SOCKET)) {
        /* TCP client. */
        vr_net_format_peer(client->conn->sd,peerid,peerid_len);
        return;
    }

    /* Unix socket client. */
    snprintf(peerid,peerid_len,"%s:0",server.unixsocket);
}

/* Return the Peer ID of client 'c'.
 *
 * The value is computed with genClientPeerId() the first time it is
 * requested and cached in c->peerid; later calls return the cached sds.
 * The returned string is owned by the client. */
char *getClientPeerId(client *c) {
    char buf[VR_INET_PEER_ID_LEN];

    if (c->peerid != NULL) return c->peerid;

    genClientPeerId(c,buf,sizeof(buf));
    c->peerid = sdsnew(buf);
    return c->peerid;
}

/* Append to the sds string 's' a single-line, human readable description
 * of the state of 'client' (the format used by CLIENT LIST) and return the
 * resulting sds, which may differ from the one passed in. */
sds catClientInfoString(sds s, client *client) {
    char flagbuf[16], evbuf[3];
    char *fp = flagbuf, *ep = evbuf;
    int mask;

    /* One letter per set flag; a lone 'N' when none applies. */
    if (client->flags & CLIENT_SLAVE)
        *fp++ = (client->flags & CLIENT_MONITOR) ? 'O' : 'S';
    if (client->flags & CLIENT_MASTER) *fp++ = 'M';
    if (client->flags & CLIENT_MULTI) *fp++ = 'x';
    if (client->flags & CLIENT_BLOCKED) *fp++ = 'b';
    if (client->flags & CLIENT_DIRTY_CAS) *fp++ = 'd';
    if (client->flags & CLIENT_CLOSE_AFTER_REPLY) *fp++ = 'c';
    if (client->flags & CLIENT_UNBLOCKED) *fp++ = 'u';
    if (client->flags & CLIENT_CLOSE_ASAP) *fp++ = 'A';
    if (client->flags & CLIENT_UNIX_SOCKET) *fp++ = 'U';
    if (client->flags & CLIENT_READONLY) *fp++ = 'r';
    if (fp == flagbuf) *fp++ = 'N';
    *fp = '\0';

    /* Events currently registered for the socket, none without a socket. */
    if (client->conn->sd == -1)
        mask = 0;
    else
        mask = aeGetFileEvents(client->vel->el,client->conn->sd);
    if (mask & AE_READABLE) *ep++ = 'r';
    if (mask & AE_WRITABLE) *ep++ = 'w';
    *ep = '\0';

    return sdscatfmt(s,
        "oid=%i id=%U addr=%s fd=%i name=%s age=%I idle=%I flags=%s db=%i sub=%i psub=%i multi=%i qbuf=%U qbuf-free=%U obl=%U oll=%U omem=%U events=%s cmd=%s",
        client->curidx,
        (unsigned long long) client->id,
        getClientPeerId(client),
        client->conn->sd,
        client->name ? (char*)client->name->ptr : "",
        (long long)(client->vel->unixtime - client->ctime),
        (long long)(client->vel->unixtime - client->lastinteraction),
        flagbuf,
        client->dictid,
        (int) dictSize(client->pubsub_channels),
        (int) dlistLength(client->pubsub_patterns),
        (client->flags & CLIENT_MULTI) ? client->mstate.count : -1,
        (unsigned long long) sdslen(client->querybuf),
        (unsigned long long) sdsavail(client->querybuf),
        (unsigned long long) client->bufpos,
        (unsigned long long) dlistLength(client->reply),
        (unsigned long long) getClientOutputBufferMemoryUsage(client),
        evbuf,
        client->lastcmd ? client->lastcmd->name : "NULL");
}

/* Build and return a new sds holding one catClientInfoString() line,
 * terminated by "\n", for every client of event loop 'vel'. The caller
 * owns the returned string. */
sds getAllClientsInfoString(vr_eventloop *vel) {
    dlistIter iter;
    dlistNode *node;
    sds out;

    /* Reserve 200 bytes per client up front, then reset the length to
     * zero so the lines are appended from the start of the buffer. */
    out = sdsnewlen(NULL,200*dlistLength(vel->clients));
    sdsclear(out);

    dlistRewind(vel->clients,&iter);
    for (node = dlistNext(&iter); node != NULL; node = dlistNext(&iter)) {
        out = catClientInfoString(out,dlistNodeValue(node));
        out = sdscatlen(out,"\n",1);
    }
    return out;
}

/* State of a CLIENT KILL command in progress. clientCommand() allocates it
 * on the first step, stores it in c->cache while the command visits the
 * workers, and frees it once the final reply has been queued. */
struct clientkilldata {
    sds addr;               /* Peer ID filter, NULL when not filtering by address. */
    int type;               /* Client type filter, -1 when not filtering by type. */
    uint64_t id;            /* Client ID filter, 0 when not filtering by ID. */
    int skipme;             /* Non-zero: never kill the client issuing the command. */
    int killed;             /* Number of clients matched so far. */
    int close_this_client;  /* Set when the issuing client matched: it is flagged
                             * CLIENT_CLOSE_AFTER_REPLY after the reply is queued. */
};

/* Implementation of the CLIENT command: LIST, KILL, SETNAME and GETNAME.
 *
 * LIST and KILL have to look at the clients of every worker. They are run
 * one worker at a time: the partial state is kept in c->cache, the client
 * is flagged CLIENT_JUMP and c->taridx is set to the next worker, until
 * c->steps reaches the number of workers minus one; at that point the reply
 * is emitted and the jump state is cleared.
 * NOTE(review): c->steps is not modified here except for being reset to 0;
 * presumably it is incremented by the code moving the client between
 * workers -- confirm against the dispatch logic. */
void clientCommand(client *c) {
    dlistNode *ln;
    dlistIter li;
    client *client;

    if (!strcasecmp(c->argv[1]->ptr,"list") && c->argc == 2) {
        /* CLIENT LIST */
        sds str = c->cache;
        sds o = getAllClientsInfoString(c->vel);

        /* Append the clients of this worker to what was collected so far. */
        str = sdscatsds(str?str:sdsempty(),o);

        if (c->steps >= (darray_n(&workers) - 1)) {
            /* Last worker: send the reply and leave the jump state. */
            addReplyBulkCBuffer(c,str,sdslen(str));
            c->steps = 0;
            c->taridx = -1;
            sdsfree(str);
            c->cache = NULL;
            c->flags &= ~CLIENT_JUMP;
        } else {
            /* More workers to visit: stash the partial listing. */
            if (!(c->flags&CLIENT_JUMP))
                c->flags |= CLIENT_JUMP;
            c->taridx = worker_get_next_idx(c->curidx);
            c->cache = str;
        }
        sdsfree(o);
        return;
    } else if (!strcasecmp(c->argv[1]->ptr,"kill")) {
        /* CLIENT KILL <ip:port>
         * CLIENT KILL <option> [value] ... <option> [value] */
        struct clientkilldata *ckd;

        if (c->steps == 0) {
            /* First step: parse the arguments into a fresh filter. */
            ckd = dalloc(sizeof(struct clientkilldata));
            ckd->addr = NULL;
            ckd->type = -1;
            ckd->id = 0;
            ckd->skipme = 1;
            ckd->killed = 0;
            ckd->close_this_client = 0;

            if (c->argc == 3) {
                /* Old style syntax: CLIENT KILL <addr> */
                ckd->addr = sdsnew(c->argv[2]->ptr);
                ckd->skipme = 0; /* With the old form, you can kill yourself. */
            } else if (c->argc > 3) {
                int i = 2; /* Next option index. */

                /* New style syntax: parse options. */
                while(i < c->argc) {
                    int moreargs = c->argc > i+1;

                    if (!strcasecmp(c->argv[i]->ptr,"id") && moreargs) {
                        long long tmp;

                        if (getLongLongFromObjectOrReply(c,c->argv[i+1],&tmp,NULL)
                            != VR_OK) {
                            if (ckd->addr) sdsfree(ckd->addr);
                            dfree(ckd);
                            return;
                        }
                        ckd->id = tmp;
                    } else if (!strcasecmp(c->argv[i]->ptr,"type") && moreargs) {
                        ckd->type = getClientTypeByName(c->argv[i+1]->ptr);
                        if (ckd->type == -1) {
                            if (ckd->addr) sdsfree(ckd->addr);
                            dfree(ckd);
                            addReplyErrorFormat(c,"Unknown client type '%s'",
                                (char*) c->argv[i+1]->ptr);
                            return;
                        }
                    } else if (!strcasecmp(c->argv[i]->ptr,"addr") && moreargs) {
                        /* The option may be repeated: release the address
                         * parsed earlier so it is not leaked, the last one
                         * given wins. */
                        if (ckd->addr) sdsfree(ckd->addr);
                        ckd->addr = sdsnew(c->argv[i+1]->ptr);
                    } else if (!strcasecmp(c->argv[i]->ptr,"skipme") && moreargs) {
                        if (!strcasecmp(c->argv[i+1]->ptr,"yes")) {
                            ckd->skipme = 1;
                        } else if (!strcasecmp(c->argv[i+1]->ptr,"no")) {
                            ckd->skipme = 0;
                        } else {
                            if (ckd->addr) sdsfree(ckd->addr);
                            dfree(ckd);
                            addReply(c,shared.syntaxerr);
                            return;
                        }
                    } else {
                        if (ckd->addr) sdsfree(ckd->addr);
                        dfree(ckd);
                        addReply(c,shared.syntaxerr);
                        return;
                    }
                    i += 2;
                }
            } else {
                if (ckd->addr) sdsfree(ckd->addr);
                dfree(ckd);
                addReply(c,shared.syntaxerr);
                return;
            }

            /* Arguments are valid: start visiting the workers. */
            if (!(c->flags&CLIENT_JUMP))
                c->flags |= CLIENT_JUMP;
            c->taridx = worker_get_next_idx(c->curidx);
            c->cache = ckd;
        } else {
            /* Later steps: resume with the filter parsed on the first one. */
            ckd = c->cache;
            c->taridx = worker_get_next_idx(c->curidx);
        }

        /* Iterate clients killing all the matching clients. */
        dlistRewind(c->vel->clients,&li);
        while ((ln = dlistNext(&li)) != NULL) {
            client = dlistNodeValue(ln);
            if (ckd->addr && strcmp(getClientPeerId(client),ckd->addr) != 0) continue;
            if (ckd->type != -1 && getClientType(client) != ckd->type) continue;
            if (ckd->id != 0 && client->id != ckd->id) continue;
            if (c == client && ckd->skipme) continue;

            /* Kill it. The calling client cannot be freed right now: it is
             * only marked, and closed after the reply. */
            if (c == client) {
                ckd->close_this_client = 1;
            } else {
                freeClient(client);
            }
            ckd->killed++;
        }

        if (c->steps >= (darray_n(&workers) - 1)) {
            /* Reply according to old/new format. */
            if (c->argc == 3) {
                if (ckd->killed == 0)
                    addReplyError(c,"No such client");
                else
                    addReply(c,shared.ok);
            } else {
                addReplyLongLong(c,ckd->killed);
            }

            c->steps = 0;
            c->taridx = -1;
            c->cache = NULL;
            c->flags &= ~CLIENT_JUMP;

            /* If this client has to be closed, flag it as CLOSE_AFTER_REPLY
             * only after we queued the reply to its output buffers. */
            if (ckd->close_this_client) c->flags |= CLIENT_CLOSE_AFTER_REPLY;

            if (ckd->addr) sdsfree(ckd->addr);
            dfree(ckd);
        }

        return;
    } else if (!strcasecmp(c->argv[1]->ptr,"setname") && c->argc == 3) {
        int j, len = sdslen(c->argv[2]->ptr);
        char *p = c->argv[2]->ptr;

        /* Setting the client name to an empty string actually removes
         * the current name. */
        if (len == 0) {
            if (c->name) freeObject(c->name);
            c->name = NULL;
            addReply(c,shared.ok);
            return;
        }

        /* Otherwise check if the charset is ok. We need to do this otherwise
         * CLIENT LIST format will break. You should always be able to
         * split by space to get the different fields. */
        for (j = 0; j < len; j++) {
            if (p[j] < '!' || p[j] > '~') { /* ASCII is assumed. */
                addReplyError(c,
                    "Client names cannot contain spaces, "
                    "newlines or special characters.");
                return;
            }
        }
        if (c->name) freeObject(c->name);
        c->name = dupStringObjectUnconstant(c->argv[2]);
        addReply(c,shared.ok);
        return;
    } else if (!strcasecmp(c->argv[1]->ptr,"getname") && c->argc == 2) {
        if (c->name)
            addReplyBulk(c,c->name);
        else
            addReply(c,shared.nullbulk);
        return;
    } else {
        addReplyError(c, "Syntax error, try CLIENT (LIST | KILL ip:port | SETNAME connection-name)");
        return;
    }

    /* NOTE(review): every branch of the chain above returns, so the code
     * below (CLIENT REPLY and CLIENT PAUSE) is currently unreachable. It is
     * left untouched; note that pauseClients() is called with a NULL event
     * loop here, which makes it a no-op. */
    if (!strcasecmp(c->argv[1]->ptr,"reply") && c->argc == 3) {
        /* CLIENT REPLY ON|OFF|SKIP */
        if (!strcasecmp(c->argv[2]->ptr,"on")) {
            c->flags &= ~(CLIENT_REPLY_SKIP|CLIENT_REPLY_OFF);
            addReply(c,shared.ok);
        } else if (!strcasecmp(c->argv[2]->ptr,"off")) {
            c->flags |= CLIENT_REPLY_OFF;
        } else if (!strcasecmp(c->argv[2]->ptr,"skip")) {
            if (!(c->flags & CLIENT_REPLY_OFF))
                c->flags |= CLIENT_REPLY_SKIP_NEXT;
        } else {
            addReply(c,shared.syntaxerr);
            return;
        }
    } else if (!strcasecmp(c->argv[1]->ptr,"pause") && c->argc == 3) {
        long long duration;

        if (getTimeoutFromObjectOrReply(c,c->argv[2],&duration,UNIT_MILLISECONDS)
                                        != VR_OK) return;
        pauseClients(NULL, duration);
        addReply(c,shared.ok);
    } else {
        addReplyError(c, "Syntax error, try CLIENT (LIST | KILL ip:port | GETNAME | SETNAME connection-name)");
    }
}

/* Replace the command vector of client 'c' with the 'argc' robj pointers
 * passed as variadic arguments. The new objects should be independent.
 * Every object of the old vector is freed, together with the old array,
 * and c->cmd is looked up again from the new first argument. */
void rewriteClientCommandVector(client *c, int argc, ...) {
    va_list args;
    robj **newargv = dalloc(sizeof(robj*)*argc);
    int i;

    /* Collect the new arguments first... */
    va_start(args,argc);
    for (i = 0; i < argc; i++)
        newargv[i] = va_arg(args, robj*);
    va_end(args);

    /* ...then release the original vector. */
    for (i = 0; i < c->argc; i++) freeObject(c->argv[i]);
    dfree(c->argv);

    /* Install the new vector and refresh the command pointer. */
    c->argc = argc;
    c->argv = newargv;
    c->cmd = lookupCommandOrOriginal(c->argv[0]->ptr);
    serverAssertWithInfo(c,NULL,c->cmd != NULL);
}

/* Install 'argv' / 'argc' as the command vector of client 'c', taking the
 * place of the current one. freeClientArgv() is called on the client and
 * the old array is released before the new vector is stored; c->cmd is
 * then looked up again from the new first argument. */
void replaceClientCommandVector(client *c, int argc, robj **argv) {
    freeClientArgv(c);
    dfree(c->argv);

    c->argc = argc;
    c->argv = argv;

    c->cmd = lookupCommandOrOriginal(c->argv[0]->ptr);
    serverAssertWithInfo(c,NULL,c->cmd != NULL);
}

/* Replace argument 'i' of the client command vector with 'newval'.
 * The new value should be independent; the old one, if any, is freed.
 *
 * 'i' may be past the current end of the vector: the array is then
 * reallocated to hold i+1 entries and c->argc is set to i+1. In that case
 * it is up to the caller to:
 *
 * 1. Make sure there are no "holes" and all the arguments are set.
 * 2. If the original argument vector was longer than the one wanted in
 *    the end, set c->argc and free the no longer used objects on c->argv.
 *
 * When the command name (index 0) is rewritten, c->cmd is looked up again. */
void rewriteClientCommandArgument(client *c, int i, robj *newval) {
    robj *previous;

    if (i >= c->argc) {
        int grown = i+1;

        c->argv = drealloc(c->argv,sizeof(robj*)*grown);
        c->argv[i] = NULL;
        c->argc = grown;
    }

    previous = c->argv[i];
    c->argv[i] = newval;
    if (previous != NULL) freeObject(previous);

    /* Nothing else to do unless the command name itself changed. */
    if (i != 0) return;

    c->cmd = lookupCommandOrOriginal(c->argv[0]->ptr);
    serverAssertWithInfo(c,NULL,c->cmd != NULL);
}

/* Return the number of bytes virtually used to store the reply not yet
 * read by the client. It is "virtual" since the reply list may contain
 * shared objects that do not really use additional memory.
 *
 * The value is c->reply_bytes plus, for every node of the reply list, the
 * size of a list node and of an object header. The static reply buffer is
 * not counted, since it is allocated anyway.
 *
 * The computation is constant-time arithmetic on already maintained
 * counters, so it can be called freely; it is used to enforce the client
 * output buffer limits. */
unsigned long getClientOutputBufferMemoryUsage(client *c) {
    unsigned long per_node = sizeof(dlistNode)+sizeof(robj);
    unsigned long nodes_overhead = per_node*dlistLength(c->reply);

    return c->reply_bytes + nodes_overhead;
}

/* Return the class of a client, used to enforce limits on different
 * classes of clients. Checks are performed in this order:
 *
 * CLIENT_TYPE_MASTER -> CLIENT_MASTER flag set.
 * CLIENT_TYPE_SLAVE  -> CLIENT_SLAVE flag set without CLIENT_MONITOR.
 * CLIENT_TYPE_PUBSUB -> CLIENT_PUBSUB flag set.
 * CLIENT_TYPE_NORMAL -> Everything else.
 */
int getClientType(client *c) {
    int is_slave, is_monitor;

    if (c->flags & CLIENT_MASTER)
        return CLIENT_TYPE_MASTER;

    is_slave = (c->flags & CLIENT_SLAVE) != 0;
    is_monitor = (c->flags & CLIENT_MONITOR) != 0;
    if (is_slave && !is_monitor)
        return CLIENT_TYPE_SLAVE;

    return (c->flags & CLIENT_PUBSUB) ? CLIENT_TYPE_PUBSUB
                                      : CLIENT_TYPE_NORMAL;
}

/* Translate a client class name ("normal", "slave", "pubsub", "master",
 * compared case-insensitively) into the matching CLIENT_TYPE_* value.
 * Returns -1 when the name is not recognized. */
int getClientTypeByName(char *name) {
    static const struct {
        const char *label;
        int type;
    } known[] = {
        { "normal", CLIENT_TYPE_NORMAL },
        { "slave",  CLIENT_TYPE_SLAVE  },
        { "pubsub", CLIENT_TYPE_PUBSUB },
        { "master", CLIENT_TYPE_MASTER },
    };
    size_t k;

    for (k = 0; k < sizeof(known)/sizeof(known[0]); k++) {
        if (strcasecmp(name,known[k].label) == 0) return known[k].type;
    }
    return -1;
}

/* Return the name of a CLIENT_TYPE_* class as a static string, or NULL
 * when 'class' is not one of the known values. */
char *getClientTypeName(int class) {
    if (class == CLIENT_TYPE_NORMAL) return "normal";
    if (class == CLIENT_TYPE_SLAVE) return "slave";
    if (class == CLIENT_TYPE_PUBSUB) return "pubsub";
    if (class == CLIENT_TYPE_MASTER) return "master";
    return NULL;
}

/* Check whether client 'c' reached the soft or hard output buffer limit
 * configured for its class, updating as a side effect the timestamp used
 * to evaluate the soft limit.
 *
 * The hard limit triggers as soon as the used memory reaches it. The soft
 * limit triggers only when the used memory stayed at or over it for more
 * than soft_limit_seconds.
 *
 * Return value: non-zero if the client reached the soft or the hard limit.
 *               Otherwise zero is returned. */
int checkClientOutputBufferLimits(client *c) {
    unsigned long used = getClientOutputBufferMemoryUsage(c);
    int type = getClientType(c);
    int hard_hit = 0, soft_hit = 0;

    /* For the purpose of output buffer limiting, masters are handled
     * like normal clients. */
    if (type == CLIENT_TYPE_MASTER) type = CLIENT_TYPE_NORMAL;

    /* A limit of zero means the limit is disabled. */
    if (server.client_obuf_limits[type].hard_limit_bytes &&
        used >= server.client_obuf_limits[type].hard_limit_bytes)
    {
        hard_hit = 1;
    }
    if (server.client_obuf_limits[type].soft_limit_bytes &&
        used >= server.client_obuf_limits[type].soft_limit_bytes)
    {
        soft_hit = 1;
    }

    if (!soft_hit) {
        /* Under the soft limit: forget any previous crossing. */
        c->obuf_soft_limit_reached_time = 0;
    } else if (c->obuf_soft_limit_reached_time == 0) {
        /* First time the soft limit is seen reached: start the clock. */
        c->obuf_soft_limit_reached_time = c->vel->unixtime;
        soft_hit = 0;
    } else {
        time_t elapsed = c->vel->unixtime - c->obuf_soft_limit_reached_time;

        /* The limit must be exceeded continuously for more than the
         * configured number of seconds to be considered reached. */
        if (elapsed <= server.client_obuf_limits[type].soft_limit_seconds)
            soft_hit = 0;
    }

    return soft_hit || hard_hit;
}

/* Schedule client 'c' for asynchronous closing when it reached the soft
 * or hard output buffer limit. The caller can tell whether the client is
 * going to be closed by checking its CLIENT_CLOSE_ASAP flag.
 *
 * The close is asynchronous because this function is called from contexts
 * where the client can't be freed safely, i.e. from the lower level
 * functions pushing data inside the client output buffers. */
void asyncCloseClientOnOutputBufferLimitReached(client *c) {
    sds info;

    ASSERT(c->reply_bytes < SIZE_MAX-(1024*64));

    /* Nothing queued in the reply list, or already scheduled. */
    if (c->reply_bytes == 0) return;
    if (c->flags & CLIENT_CLOSE_ASAP) return;

    if (!checkClientOutputBufferLimits(c)) return;

    info = catClientInfoString(sdsempty(),c);
    freeClientAsync(c);
    log_warn("Client %s scheduled to be closed ASAP for overcoming of output buffer limits.", info);
    sdsfree(info);
}

/* Try to write the pending replies of every slave in repl.slaves without
 * returning control to the event loop. Used by freeMemoryIfNeeded(), and
 * by SHUTDOWN for a best-effort attempt to send slaves the latest writes. */
void flushSlavesOutputBuffers(void) {
    dlistIter iter;
    dlistNode *node;

    dlistRewind(repl.slaves,&iter);
    for (node = dlistNext(&iter); node != NULL; node = dlistNext(&iter)) {
        client *slave = dlistNodeValue(node);
        int mask = aeGetFileEvents(repl.vel.el,slave->conn->sd);

        /* Slaves without the writable event installed are skipped. This
         * leaves out slaves in STATE_ONLINE having put_online_on_ack set:
         * for them the writable event is never installed, as the purpose
         * of put_online_on_ack is to postpone that moment. This is wanted,
         * since such slaves should not receive writes before the first
         * ACK. */
        if (!(mask & AE_WRITABLE)) continue;
        if (slave->replstate != SLAVE_STATE_ONLINE) continue;
        if (!clientHasPendingReplies(slave)) continue;

        writeToClient(slave->conn->sd,slave,0);
    }
}

/* Pause the clients of event loop 'vel' up to the unixtime 'end' (in ms).
 * While clients are paused no command is processed from them, so the data
 * set can't change during that time.
 *
 * Slaves are still served while normal and Pub/Sub clients are paused, so
 * this can be used on server upgrades where slaves must process the latest
 * bytes of the replication stream before being turned to masters.
 *
 * The call always succeeds, even with a pause already in progress: the
 * pause is extended when 'end' is later than the current end time, and
 * left unchanged otherwise. A NULL 'vel' makes the call a no-op. */
void pauseClients(vr_eventloop *vel, long long end) {
    int keep_deadline;

    if (vel == NULL) return;

    /* An active pause ending at or after 'end' already covers the request. */
    keep_deadline = vel->clients_paused &&
                    end <= vel->clients_pause_end_time;
    if (!keep_deadline)
        vel->clients_pause_end_time = end;

    vel->clients_paused = 1;
}

/* Return non-zero if the clients of event loop 'vel' are currently paused.
 * As a side effect, when the pause end time is in the past the pause is
 * cleared and the clients are queued for re-processing of their input. */
int clientsArePaused(vr_eventloop *vel) {
    dlistIter iter;
    dlistNode *node;

    /* Not paused, or paused and the end time is not reached yet. */
    if (!vel->clients_paused) return vel->clients_paused;
    if (vel->clients_pause_end_time >= vel->mstime) return vel->clients_paused;

    vel->clients_paused = 0;

    /* Put all the clients in the unblocked clients queue in order to
     * force the re-processing of the input buffer if any. */
    dlistRewind(vel->clients,&iter);
    for (node = dlistNext(&iter); node != NULL; node = dlistNext(&iter)) {
        client *cur = dlistNodeValue(node);

        /* Don't touch slaves and blocked clients. The pending requests
         * of the latter are processed when they get unblocked. */
        if (cur->flags & (CLIENT_SLAVE|CLIENT_BLOCKED)) continue;

        cur->flags |= CLIENT_UNBLOCKED;
        dlistAddNodeTail(vel->unblocked_clients,cur);
    }

    return vel->clients_paused;
}

/* Serve a handful of events while the caller is stuck in an operation that
 * cannot be interrupted (for example loading the data set at startup or
 * after a full resynchronization with the master), so that clients can still
 * be answered with the -LOADING error.
 *
 * The event loop of 'vel' is polled without waiting, followed by a flush of
 * the clients with pending writes. This is repeated up to four times, as long
 * as the previous round did some work, which is enough to move a client
 * through the accept, read, write, close sequence.
 *
 * Returns the total number of events processed. */
int processEventsWhileBlocked(vr_eventloop *vel) {
    int total = 0;
    int round;

    for (round = 0; round < 4; round++) {
        int handled = aeProcessEvents(vel->el, AE_FILE_EVENTS|AE_DONT_WAIT);

        handled += handleClientsWithPendingWrites(vel);

        /* An idle round means there is nothing left to do right now. */
        if (handled == 0) break;
        total += handled;
    }

    return total;
}

/* Return the current value of the ncurr_cconn connection counter, read with
 * the same synchronization primitive used by the update_curr_clients_*
 * macros for the active build configuration. */
int
current_clients(void)
{
#if defined(__ATOMIC_RELAXED) || defined(HAVE_ATOMIC)
    /* Adding zero leaves the counter untouched and yields its value. */
    return update_curr_clients_add(0);
#else
    int snapshot;

    pthread_mutex_lock(&curr_clients_mutex);
    snapshot = ncurr_cconn;
    pthread_mutex_unlock(&curr_clients_mutex);

    return snapshot;
#endif
}


================================================
FILE: src/vr_client.h
================================================
#ifndef _VR_CLIENT_H_
#define _VR_CLIENT_H_

/* NOTE(review): presumably the budget a single writable event may spend
 * sending data to one client before yielding; the consumer is not visible
 * from this header, confirm against writeToClient(). */
#define NET_MAX_WRITES_PER_EVENT (1024*64)

/* Protocol and I/O buffer sizes, in bytes. */
#define PROTO_MAX_QUERYBUF_LEN  (1024*1024*1024) /* 1GB max query buffer. */
#define PROTO_IOBUF_LEN         (1024*16)  /* Generic I/O buffer size */
#define PROTO_REPLY_CHUNK_BYTES (16*1024) /* 16k output buffer; also the size
                                             of the client 'buf' array. */
#define PROTO_INLINE_MAX_SIZE   (1024*64) /* Max size of inline reads */
#define PROTO_MBULK_BIG_ARG     (1024*32) /* 32k. NOTE(review): presumably the
                                             size from which a bulk argument
                                             is treated as "big"; confirm in
                                             the multi bulk parser. */

/* Client flags: single-bit values OR-ed together in the 'flags' field of
 * the client structure. */
#define CLIENT_SLAVE (1<<0)   /* This client is a slave server */
#define CLIENT_MASTER (1<<1)  /* This client is a master server */
#define CLIENT_MONITOR (1<<2) /* This client is a slave monitor, see MONITOR */
#define CLIENT_MULTI (1<<3)   /* This client is in a MULTI context */
#define CLIENT_BLOCKED (1<<4) /* The client is waiting in a blocking operation */
#define CLIENT_DIRTY_CAS (1<<5) /* Watched keys modified. EXEC will fail. */
#define CLIENT_CLOSE_AFTER_REPLY (1<<6) /* Close after writing entire reply. */
#define CLIENT_UNBLOCKED (1<<7) /* This client was unblocked and is stored in
                                  the unblocked_clients list of its event
                                  loop. */
#define CLIENT_LUA (1<<8) /* This is a non connected client used by Lua */
#define CLIENT_ASKING (1<<9)     /* Client issued the ASKING command */
#define CLIENT_CLOSE_ASAP (1<<10)/* Close this client ASAP */
#define CLIENT_UNIX_SOCKET (1<<11) /* Client connected via Unix domain socket */
#define CLIENT_DIRTY_EXEC (1<<12)  /* EXEC will fail for errors while queueing */
#define CLIENT_MASTER_FORCE_REPLY (1<<13)  /* Queue replies even if is master */
#define CLIENT_FORCE_AOF (1<<14)   /* Force AOF propagation of current cmd. */
#define CLIENT_FORCE_REPL (1<<15)  /* Force replication of current cmd. */
#define CLIENT_PRE_PSYNC (1<<16)   /* Instance doesn't understand PSYNC. */
#define CLIENT_READONLY (1<<17)    /* Cluster client is in read-only state. */
#define CLIENT_PUBSUB (1<<18)      /* Client is in Pub/Sub mode. */
#define CLIENT_PREVENT_AOF_PROP (1<<19)  /* Don't propagate to AOF. */
#define CLIENT_PREVENT_REPL_PROP (1<<20)  /* Don't propagate to slaves. */
/* Both of the above: no propagation at all. call() skips its propagation
 * step only when both bits are set. */
#define CLIENT_PREVENT_PROP (CLIENT_PREVENT_AOF_PROP|CLIENT_PREVENT_REPL_PROP)
#define CLIENT_PENDING_WRITE (1<<21) /* Client has output to send but a write
                                        handler is not yet installed. */
#define CLIENT_REPLY_OFF (1<<22)   /* Don't send replies to client. */
#define CLIENT_REPLY_SKIP_NEXT (1<<23)  /* Set CLIENT_REPLY_SKIP for next cmd */
#define CLIENT_REPLY_SKIP (1<<24)  /* Don't send just this reply. */
#define CLIENT_LUA_DEBUG (1<<25)  /* Run EVAL in debug mode. */
#define CLIENT_LUA_DEBUG_SYNC (1<<26)  /* EVAL debugging without fork() */
/* NOTE(review): undocumented in the original. Presumably marks a client that
 * is jumping between workers (see curidx/taridx/steps in the client
 * structure); confirm against the code that sets it. */
#define CLIENT_JUMP (1<<27)

/* NOTE(review): same value and meaning as PROTO_REPLY_CHUNK_BYTES defined in
 * this header; looks like a leftover of the old naming. Check for remaining
 * users before removing. */
#define REDIS_REPLY_CHUNK_BYTES (16*1024) /* 16k output buffer */

/* Client request types (reqtype field in client structure). */
#define PROTO_REQ_INLINE 1
#define PROTO_REQ_MULTIBULK 2

/* Client classes for client limits, currently used only for
 * the max-client-output-buffer limit implementation. */
#define CLIENT_TYPE_NORMAL 0 /* Normal req-reply clients + MONITORs */
#define CLIENT_TYPE_SLAVE 1  /* Slaves. */
#define CLIENT_TYPE_PUBSUB 2 /* Clients subscribed to PubSub channels. */
#define CLIENT_TYPE_MASTER 3 /* Master. */
#define CLIENT_TYPE_OBUF_COUNT 3 /* Number of client classes exposed to the
                                    output buffer configuration. Just the
                                    first three: normal, slave, pubsub.
                                    CLIENT_TYPE_MASTER is deliberately
                                    outside this range. */

/* Client block type (btype field in client structure)
 * if CLIENT_BLOCKED flag is set. */
#define BLOCKED_NONE 0    /* Not blocked, no CLIENT_BLOCKED flag set. */
#define BLOCKED_LIST 1    /* BLPOP & co. */
#define BLOCKED_WAIT 2    /* WAIT for synchronous replication. */

/* With multiplexing we need to keep per-client state.
 * Clients are kept in a linked list (see the 'clients' list of the event
 * loop they are attached to). */
typedef struct client {
    uint64_t id;            /* Client incremental unique ID. */
    
    struct conn *conn;      /* Underlying connection; conn->sd is the socket
                               descriptor handed to the event loop and to
                               writeToClient(). */
    vr_eventloop *vel;      /* Event loop currently serving this client; holds
                               the per-loop state reached through c->vel. */
    
    redisDb *db;            /* Pointer to currently dispatch DB. */
    int dictid;             /* ID of the currently SELECTed DB. */
    int scanid;             /* Internal ID of the current DB for scan */
    robj *name;             /* As set by CLIENT SETNAME. */
    sds querybuf;           /* Buffer we use to accumulate client queries. */
    size_t querybuf_peak;   /* Recent (100ms or more) peak of querybuf size. */
    int argc;               /* Num of arguments of current command. */
    robj **argv;            /* Arguments of current command. */
    struct redisCommand *cmd, *lastcmd;  /* Current command and last command
                                            executed; processCommand() sets
                                            both from the command lookup. */
    int reqtype;            /* Request protocol type: PROTO_REQ_* */
    int multibulklen;       /* Number of multi bulk arguments left to read. */
    long bulklen;           /* Length of bulk argument in multi bulk request. */
    dlist *reply;            /* List of reply objects to send to the client. */
    unsigned long long reply_bytes; /* Tot bytes of objects in reply list. */
    size_t sentlen;         /* Amount of bytes already sent in the current
                               buffer or object being sent. */
    time_t ctime;           /* Client creation time. */
    time_t lastinteraction; /* Time of the last interaction, used for timeout */
    time_t obuf_soft_limit_reached_time; /* NOTE(review): presumably the time
                               the output buffer soft limit was first
                               exceeded; confirm against the limit check. */
    int flags;              /* Client flags: CLIENT_* macros. */
    int authenticated;      /* 0 = not authenticated. processCommand() accepts
                               any non-zero value when requirepass is set and
                               demands a value >= 2 for commands flagged
                               needadmin when adminpass is set. */
    int replstate;          /* Replication state if this is a slave. */
    int repl_put_online_on_ack; /* Install slave write handler on ACK. */
    int repldbfd;           /* Replication DB file descriptor. */
    off_t repldboff;        /* Replication DB file offset. */
    off_t repldbsize;       /* Replication DB file size. */
    sds replpreamble;       /* Replication DB preamble. */
    long long reploff;      /* Replication offset if this is our master. */
    long long repl_ack_off; /* Replication ack offset, if this is a slave. */
    long long repl_ack_time;/* Replication ack time, if this is a slave. */
    long long psync_initial_offset; /* FULLRESYNC reply offset other slaves
                                       copying this slave output buffer
                                       should use. */
    char replrunid[CONFIG_RUN_ID_SIZE+1]; /* Master run id if is a master. */
    int slave_listening_port; /* As configured with: SLAVECONF listening-port */
    int slave_capa;         /* Slave capabilities: SLAVE_CAPA_* bitwise OR. */
    multiState mstate;      /* MULTI/EXEC state */
    int btype;              /* Type of blocking op if CLIENT_BLOCKED. */
    blockingState bpop;     /* blocking state */
    long long woff;         /* Last write global replication offset. */
    dlist *watched_keys;     /* Keys WATCHED for MULTI/EXEC CAS */
    dict *pubsub_channels;  /* channels a client is interested in (SUBSCRIBE) */
    dlist *pubsub_patterns;  /* patterns a client is interested in (SUBSCRIBE) */
    sds peerid;             /* Cached peer ID. */

    int curidx;             /* The worker idx that this client currently belongs to. */
    int taridx;             /* The target worker idx that this client will jump to */
    int steps;              /* The steps that this client jumps between workers. */
    void *cache;            /* Cache data for client to jump between workers. */

    /* Response buffer: fixed size area embedded in the client itself. */
    int bufpos;             /* NOTE(review): presumably the number of bytes of
                               'buf' currently in use; confirm in the reply
                               code. */
    char buf[PROTO_REPLY_CHUNK_BYTES];
} client;

/* Output buffer limits for one class of clients (see CLIENT_TYPE_*).
 * NOTE(review): the enforcement code is not visible from this header; the
 * field notes below follow the field names, confirm against the checker. */
typedef struct clientBufferLimitsConfig {
    unsigned long long hard_limit_bytes;  /* Hard limit, in bytes. */
    unsigned long long soft_limit_bytes;  /* Soft limit, in bytes. */
    time_t soft_limit_seconds;            /* Seconds associated with the soft
                                             limit. */
} clientBufferLimitsConfig;

/* networking.c -- Networking and Client related operations */
client *createClient(vr_eventloop *vel, struct conn *conn);
void closeTimedoutClients(void);
void freeClient(client *c);
void freeClientAsync(client *c);
void resetClient(client *c);
void sendReplyToClient(aeEventLoop *el, int fd, void *privdata, int mask);
void *addDeferredMultiBulkLength(client *c);
void setDeferredMultiBulkLength(client *c, void *node, long length);
void processInputBuffer(client *c);
void readQueryFromClient(aeEventLoop *el, int fd, void *privdata, int mask);
void addReplyBulk(client *c, robj *obj);
void addReplyBulkCString(client *c, const char *s);
void addReplyBulkCBuffer(client *c, const void *p, size_t len);
void addReplyBulkLongLong(client *c, long long ll);
void addReply(client *c, robj *obj);
void addReplySds(client *c, sds s);
void addReplyString(client *c, const char *s, size_t len);
void addReplyErrorLength(client *c, const char *s, size_t len);
void addReplyBulkSds(client *c, sds s);
void addReplyError(client *c, const char *err);
void addReplyStatusLength(client *c, const char *s, size_t len);
void addReplyStatus(client *c, const char *status);
void addReplyDouble(client *c, double d);
void addReplyHumanLongDouble(client *c, long double d);
void addReplyLongLong(client *c, long long ll);
void addReplyMultiBulkLen(client *c, long length);
void copyClientOutputBuffer(client *dst, client *src);
void *dupClientReplyValue(void *o);
void freeClientReplyValue(void *o);
void getClientsMaxBuffers(vr_eventloop *vel, unsigned long *longest_output_list,
                          unsigned long *biggest_input_buffer);
char *getClientPeerId(client *client);
sds catClientInfoString(sds s, client *client);
sds getAllClientsInfoString(vr_eventloop *vel);
void clientCommand(client *c);
void rewriteClientCommandVector(client *c, int argc, ...);
void rewriteClientCommandArgument(client *c, int i, robj *newval);
void replaceClientCommandVector(client *c, int argc, robj **argv);
unsigned long getClientOutputBufferMemoryUsage(client *c);
void freeClientsInAsyncFreeQueue(vr_eventloop *vel);
void asyncCloseClientOnOutputBufferLimitReached(client *c);
int getClientType(client *c);
int getClientTypeByName(char *name);
char *getClientTypeName(int class);
void flushSlavesOutputBuffers(void);
void disconnectSlaves(void);
int listenToPort(int port, int *fds, int *count);
void pauseClients(vr_eventloop *vel, long long duration);
int clientsArePaused(vr_eventloop *vel);
int processEventsWhileBlocked(vr_eventloop *vel);
int handleClientsWithPendingWrites(vr_eventloop *vel);
int clientHasPendingReplies(client *c);
void unlinkClientFromEventloop(client *c);
void linkClientToEventloop(client *c,vr_eventloop *vel);
void unlinkClient(client *c);
int writeToClient(int fd, client *c, int handler_installed);

#ifdef __GNUC__
void addReplyErrorFormat(client *c, const char *fmt, ...)
    __attribute__((format(printf, 2, 3)));
void addReplyStatusFormat(client *c, const char *fmt, ...)
    __attribute__((format(printf, 2, 3)));
#else
void addReplyErrorFormat(client *c, const char *fmt, ...);
void addReplyStatusFormat(client *c, const char *fmt, ...);
#endif

/* Counter of the current client connections, read by current_clients() and
 * modified only through the update_curr_clients_* macros below. */
extern int ncurr_cconn;

/* Three implementations of the counter update, selected at compile time:
 *  1. __atomic builtins with relaxed ordering, when available.
 *  2. Legacy __sync builtins, when HAVE_ATOMIC is defined.
 *  3. A mutex protected plain integer otherwise.
 *
 * In the first two cases the macros are expressions evaluating to the
 * updated counter value. */
#if defined(__ATOMIC_RELAXED)
#define update_curr_clients_add(__n) __atomic_add_fetch(&ncurr_cconn, (__n), __ATOMIC_RELAXED)
#define update_curr_clients_sub(__n) __atomic_sub_fetch(&ncurr_cconn, (__n), __ATOMIC_RELAXED)
#elif defined(HAVE_ATOMIC)
#define update_curr_clients_add(__n) __sync_add_and_fetch(&ncurr_cconn, (__n))
#define update_curr_clients_sub(__n) __sync_sub_and_fetch(&ncurr_cconn, (__n))
#else
/* NOTE(review): this is a definition, not a declaration. In this fallback
 * configuration every translation unit including the header defines its own
 * curr_clients_mutex symbol, which is expected to clash at link time. It
 * should become an 'extern' declaration with a single definition in a .c
 * file. */
pthread_mutex_t curr_clients_mutex = PTHREAD_MUTEX_INITIALIZER;

/* NOTE(review): unlike the atomic variants these two macros are statements,
 * so they cannot be used where a value is expected. */
#define update_curr_clients_add(__n) do {       \
    pthread_mutex_lock(&curr_clients_mutex);    \
    ncurr_cconn += (__n);                       \
    pthread_mutex_unlock(&curr_clients_mutex);  \
} while(0)

#define update_curr_clients_sub(__n) do {       \
    pthread_mutex_lock(&curr_clients_mutex);    \
    ncurr_cconn -= (__n);                       \
    pthread_mutex_unlock(&curr_clients_mutex);  \
} while(0)
#endif

/* Return the current value of ncurr_cconn. */
int current_clients(void);

#endif


================================================
FILE: src/vr_command.c
================================================
#include <vr_core.h>

/* Command table. sds string -> command struct pointer.
 *
 * The dictionary owns its keys (a key destructor is installed) but not its
 * values: no value destructor is set, and populateCommandTable() stores
 * pointers into the static redisCommandTable array. Going by the callback
 * names, keys are hashed and compared ignoring case. */
dictType commandTableDictType = {
    dictSdsCaseHash,           /* hash function */
    NULL,                      /* key dup */
    NULL,                      /* val dup */
    dictSdsKeyCaseCompare,     /* key compare */
    dictSdsDestructor,         /* key destructor */
    NULL                       /* val destructor */
};

/* Our command table.
 *
 * Every entry is composed of the following fields:
 *
 * name: a string representing the command name.
 * function: pointer to the C function implementing the command.
 * arity: number of arguments, it is possible to use -N to say >= N
 * sflags: command flags as string. See below for a table of flags.
 * flags: flags as bitmask. Computed by Redis using the 'sflags' field.
 * get_keys_proc: an optional function to get key arguments from a command.
 *                This is only used when the following three fields are not
 *                enough to specify what arguments are keys.
 * first_key_index: first argument that is a key
 * last_key_index: last argument that is a key
 * key_step: step to get all the keys from first to last argument. For instance
 *           in MSET the step is two since arguments are key,val,key,val,...
 * microseconds: microseconds of total execution time for this command.
 * calls: total number of calls of this command.
 *
 * The flags, microseconds and calls fields are computed by Redis and should
 * always be set to zero.
 *
 * NOTE(review): the command structure also has 'idx' and 'needadmin'
 * members, assigned at startup by populateCommandTable() and
 * populateCommandsNeedAdminpass(); they are not part of the list above.
 *
 * Command flags are expressed using strings where every character represents
 * a flag. Later the populateCommandTable() function will take care of
 * populating the real 'flags' field using these characters.
 *
 * This is the meaning of the flags:
 *
 * w: write command (may modify the key space).
 * r: read command  (will never modify the key space).
 * m: may increase memory usage once called. Don't allow if out of memory.
 * a: admin command, like SAVE or SHUTDOWN.
 * p: Pub/Sub related command.
 * f: force replication of this command, regardless of server.dirty.
 *    NOTE(review): populateCommandTable() has no case for 'f' and would
 *    panic on it; no entry below uses it.
 * s: command not allowed in scripts.
 * R: random command. Command is not deterministic, that is, the same command
 *    with the same arguments, with the same key space, may have different
 *    results. For instance SPOP and RANDOMKEY are two random commands.
 * S: Sort command output array if called from script, so that the output
 *    is deterministic.
 * l: Allow command while loading the database.
 * t: Allow command while a slave has stale data but is not allowed to
 *    serve this data. Normally no command is accepted in this condition
 *    but just a few.
 * M: Do not automatically propagate the command on MONITOR.
 * k: Perform an implicit ASKING for this command, so the command will be
 *    accepted in cluster mode if the slot is marked as 'importing'.
 * F: Fast command: O(1) or O(log(N)) command that should never delay
 *    its execution as long as the kernel scheduler is giving us time.
 *    Note that commands that may trigger a DEL as a side effect (like SET)
 *    are not fast commands.
 */
struct redisCommand redisCommandTable[] = {
    /* Connection */
    {"ping",pingCommand,-1,"tF",0,NULL,0,0,0,0,0},
    {"echo",echoCommand,2,"F",0,NULL,0,0,0,0,0},
    {"select",selectCommand,2,"lF",0,NULL,0,0,0,0,0},
    {"auth",authCommand,2,"sltF",0,NULL,0,0,0,0,0},
    {"admin",adminCommand,2,"sltF",0,NULL,0,0,0,0,0},
    /* Server */
    {"info",infoCommand,-1,"lt",0,NULL,0,0,0,0,0},
    {"flushdb",flushdbCommand,1,"w",0,NULL,0,0,0,0,0},
    {"flushall",flushallCommand,1,"w",0,NULL,0,0,0,0,0},
    {"time",timeCommand,1,"RF",0,NULL,0,0,0,0,0},
    {"dbsize",dbsizeCommand,1,"rF",0,NULL,0,0,0,0,0},
    {"command",commandCommand,0,"lt",0,NULL,0,0,0,0,0},
    {"config",configCommand,-2,"lat",0,NULL,0,0,0,0,0},
    {"client",clientCommand,-2,"as",0,NULL,0,0,0,0,0},
    {"slowlog",slowlogCommand,-2,"a",0,NULL,0,0,0,0,0},
    /* Key */
    {"del",delCommand,-2,"w",0,NULL,1,-1,1,0,0},
    {"exists",existsCommand,-2,"rF",0,NULL,1,-1,1,0,0},
    {"ttl",ttlCommand,2,"rF",0,NULL,1,1,1,0,0},
    {"pttl",pttlCommand,2,"rF",0,NULL,1,1,1,0,0},
    {"expire",expireCommand,3,"wF",0,NULL,1,1,1,0,0},
    {"expireat",expireatCommand,3,"wF",0,NULL,1,1,1,0,0},
    {"pexpire",pexpireCommand,3,"wF",0,NULL,1,1,1,0,0},
    {"pexpireat",pexpireatCommand,3,"wF",0,NULL,1,1,1,0,0},
    {"persist",persistCommand,2,"wF",0,NULL,1,1,1,0,0},
    {"randomkey",randomkeyCommand,1,"rR",0,NULL,0,0,0,0,0},
    {"type",typeCommand,2,"rF",0,NULL,1,1,1,0,0},
    {"keys",keysCommand,2,"rS",0,NULL,0,0,0,0,0},
    {"scan",scanCommand,-2,"rR",0,NULL,0,0,0,0,0},
    {"object",objectCommand,3,"r",0,NULL,2,2,2,0,0},
    /* String */
    {"get",getCommand,2,"rF",0,NULL,1,1,1,0,0},
    {"set",setCommand,-3,"wm",0,NULL,1,1,1,0,0},
    {"setnx",setnxCommand,3,"wmF",0,NULL,1,1,1,0,0},
    {"setex",setexCommand,4,"wm",0,NULL,1,1,1,0,0},
    {"psetex",psetexCommand,4,"wm",0,NULL,1,1,1,0,0},
    {"incr",incrCommand,2,"wmF",0,NULL,1,1,1,0,0},
    {"decr",decrCommand,2,"wmF",0,NULL,1,1,1,0,0},
    {"incrby",incrbyCommand,3,"wmF",0,NULL,1,1,1,0,0},
    {"decrby",decrbyCommand,3,"wmF",0,NULL,1,1,1,0,0},
    {"append",appendCommand,3,"wm",0,NULL,1,1,1,0,0},
    {"strlen",strlenCommand,2,"rF",0,NULL,1,1,1,0,0},
    {"getset",getsetCommand,3,"wm",0,NULL,1,1,1,0,0},
    {"incrbyfloat",incrbyfloatCommand,3,"wmF",0,NULL,1,1,1,0,0},
    {"setbit",setbitCommand,4,"wm",0,NULL,1,1,1,0,0},
    {"getbit",getbitCommand,3,"rF",0,NULL,1,1,1,0,0},
    {"setrange",setrangeCommand,4,"wm",0,NULL,1,1,1,0,0},
    {"getrange",getrangeCommand,4,"r",0,NULL,1,1,1,0,0},
    {"bitcount",bitcountCommand,-2,"r",0,NULL,1,1,1,0,0},
    {"bitpos",bitposCommand,-3,"r",0,NULL,1,1,1,0,0},
    {"mget",mgetCommand,-2,"r",0,NULL,1,-1,1,0,0},
    {"mset",msetCommand,-3,"wm",0,NULL,1,-1,2,0,0},
    /* Hash */
    {"hset",hsetCommand,4,"wmF",0,NULL,1,1,1,0,0},
    {"hget",hgetCommand,3,"rF",0,NULL,1,1,1,0,0},
    {"hlen",hlenCommand,2,"rF",0,NULL,1,1,1,0,0},
    {"hdel",hdelCommand,-3,"wF",0,NULL,1,1,1,0,0},
    {"hexists",hexistsCommand,3,"rF",0,NULL,1,1,1,0,0},
    {"hkeys",hkeysCommand,2,"rS",0,NULL,1,1,1,0,0},
    {"hvals",hvalsCommand,2,"rS",0,NULL,1,1,1,0,0},
    {"hgetall",hgetallCommand,2,"r",0,NULL,1,1,1,0,0},
    {"hincrby",hincrbyCommand,4,"wmF",0,NULL,1,1,1,0,0},
    {"hincrbyfloat",hincrbyfloatCommand,4,"wmF",0,NULL,1,1,1,0,0},
    {"hmget",hmgetCommand,-3,"r",0,NULL,1,1,1,0,0},
    {"hmset",hmsetCommand,-4,"wm",0,NULL,1,1,1,0,0},
    {"hsetnx",hsetnxCommand,4,"wmF",0,NULL,1,1,1,0,0},
    {"hstrlen",hstrlenCommand,3,"rF",0,NULL,1,1,1,0,0},
    {"hscan",hscanCommand,-3,"rR",0,NULL,1,1,1,0,0},
    /* List */
    {"rpush",rpushCommand,-3,"wmF",0,NULL,1,1,1,0,0},
    {"lpush",lpushCommand,-3,"wmF",0,NULL,1,1,1,0,0},
    {"lrange",lrangeCommand,4,"r",0,NULL,1,1,1,0,0},
    {"rpop",rpopCommand,2,"wF",0,NULL,1,1,1,0,0},
    {"lpop",lpopCommand,2,"wF",0,NULL,1,1,1,0,0},
    {"llen",llenCommand,2,"rF",0,NULL,1,1,1,0,0},
    {"lrem",lremCommand,4,"w",0,NULL,1,1,1,0,0},
    {"ltrim",ltrimCommand,4,"w",0,NULL,1,1,1,0,0},
    {"lindex",lindexCommand,3,"r",0,NULL,1,1,1,0,0},
    {"lset",lsetCommand,4,"wm",0,NULL,1,1,1,0,0},
    /* Set */
    {"sadd",saddCommand,-3,"wmF",0,NULL,1,1,1,0,0},
    {"smembers",smembersCommand,2,"rS",0,NULL,1,1,1,0,0},
    {"scard",scardCommand,2,"rF",0,NULL,1,1,1,0,0},
    {"srem",sremCommand,-3,"wF",0,NULL,1,1,1,0,0},
    {"spop",spopCommand,-2,"wRsF",0,NULL,1,1,1,0,0},
    {"sismember",sismemberCommand,3,"rF",0,NULL,1,1,1,0,0},
    {"sscan",sscanCommand,-3,"rR",0,NULL,1,1,1,0,0},
    {"sunion",sunionCommand,-2,"rS",0,NULL,1,-1,1,0,0},
    {"sunionstore",sunionstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
    {"sdiff",sdiffCommand,-2,"rS",0,NULL,1,-1,1,0,0},
    {"sdiffstore",sdiffstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
    {"sinter",sinterCommand,-2,"rS",0,NULL,1,-1,1,0,0},
    {"sinterstore",sinterstoreCommand,-3,"wm",0,NULL,1,-1,1,0,0},
    /* SortedSet */
    {"zadd",zaddCommand,-4,"wmF",0,NULL,1,1,1,0,0},
    {"zincrby",zincrbyCommand,4,"wmF",0,NULL,1,1,1,0,0},
    {"zrange",zrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
    {"zrevrange",zrevrangeCommand,-4,"r",0,NULL,1,1,1,0,0},
    {"zrem",zremCommand,-3,"wF",0,NULL,1,1,1,0,0},
    {"zcard",zcardCommand,2,"rF",0,NULL,1,1,1,0,0},
    {"zcount",zcountCommand,4,"rF",0,NULL,1,1,1,0,0},
    {"zrangebyscore",zrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
    {"zrevrangebyscore",zrevrangebyscoreCommand,-4,"r",0,NULL,1,1,1,0,0},
    {"zrank",zrankCommand,3,"rF",0,NULL,1,1,1,0,0},
    {"zrevrank",zrevrankCommand,3,"rF",0,NULL,1,1,1,0,0},
    {"zscore",zscoreCommand,3,"rF",0,NULL,1,1,1,0,0},
    {"zremrangebyscore",zremrangebyscoreCommand,4,"w",0,NULL,1,1,1,0,0},
    {"zremrangebyrank",zremrangebyrankCommand,4,"w",0,NULL,1,1,1,0,0},
    {"zremrangebylex",zremrangebylexCommand,4,"w",0,NULL,1,1,1,0,0},
    {"zscan",zscanCommand,-3,"rR",0,NULL,1,1,1,0,0},
    /* HyperLogLog */
    {"pfadd",pfaddCommand,-2,"wmF",0,NULL,1,1,1,0,0},
    {"pfcount",pfcountCommand,-2,"r",0,NULL,1,-1,1,0,0}
};

/* Walk the hard coded redisCommandTable and, for every entry: translate the
 * 'sflags' string into the 'flags' bitmask, register the command by name in
 * server.commands, and record the entry position in 'idx'.
 *
 * An unknown flag character triggers a server panic. */
void populateCommandTable(void) {
    int total = sizeof(redisCommandTable)/sizeof(struct redisCommand);
    int pos;

    for (pos = 0; pos < total; pos++) {
        struct redisCommand *cmd = &redisCommandTable[pos];
        char *flag;
        int retval1;

        /* One character of 'sflags' maps to exactly one CMD_* bit. */
        for (flag = cmd->sflags; *flag != '\0'; flag++) {
            switch (*flag) {
            case 'w': cmd->flags |= CMD_WRITE; break;
            case 'r': cmd->flags |= CMD_READONLY; break;
            case 'm': cmd->flags |= CMD_DENYOOM; break;
            case 'a': cmd->flags |= CMD_ADMIN; break;
            case 'p': cmd->flags |= CMD_PUBSUB; break;
            case 's': cmd->flags |= CMD_NOSCRIPT; break;
            case 'R': cmd->flags |= CMD_RANDOM; break;
            case 'S': cmd->flags |= CMD_SORT_FOR_SCRIPT; break;
            case 'l': cmd->flags |= CMD_LOADING; break;
            case 't': cmd->flags |= CMD_STALE; break;
            case 'M': cmd->flags |= CMD_SKIP_MONITOR; break;
            case 'k': cmd->flags |= CMD_ASKING; break;
            case 'F': cmd->flags |= CMD_FAST; break;
            default: serverPanic("Unsupported command flag"); break;
            }
        }

        /* The dictionary takes ownership of the freshly created key. */
        retval1 = dictAdd(server.commands, sdsnew(cmd->name), cmd);
        ASSERT(retval1 == DICT_OK);

        cmd->idx = pos;
    }
}

/* Flag as 'needadmin' every command listed under the CONFIG_SOPN_COMMANDSNAP
 * configuration option.
 *
 * The names are fetched into a temporary array of sds strings owned by this
 * function. Each name is looked up in the command table; the first unknown
 * name is logged and makes the function fail. Commands flagged before the
 * failure keep their flag, names after it are not applied.
 *
 * Whatever the outcome, every fetched name and the array storage itself are
 * released before returning.
 *
 * Returns VR_OK when every name matched a command, VR_ERROR otherwise. */
int populateCommandsNeedAdminpass(void) {
    struct darray commands_need_adminpass;
    sds *command_name;
    struct redisCommand *command;
    int ret = VR_OK;

    darray_init(&commands_need_adminpass,1,sizeof(sds));
    conf_server_get(CONFIG_SOPN_COMMANDSNAP,&commands_need_adminpass);

    /* Always drain the array completely, even after an error, so that no
     * name is leaked and the array is empty when it gets deinitialized. */
    while (darray_n(&commands_need_adminpass)) {
        command_name = darray_pop(&commands_need_adminpass);

        if (ret == VR_OK) {
            command = lookupCommand(*command_name);
            if (command == NULL) {
                /* darray_pop() yields a pointer to the stored sds: it has
                 * to be dereferenced to obtain the string for %s. */
                log_error("Unknown command %s for commands-need-adminpass",
                    *command_name);
                ret = VR_ERROR;
            } else {
                command->needadmin = 1;
            }
        }

        sdsfree(*command_name);
    }
    darray_deinit(&commands_need_adminpass);

    return ret;
}

/* Return the command registered under 'name' in server.commands, or
 * whatever dictFetchValue() yields when there is no such entry. */
struct redisCommand *lookupCommand(sds name) {
    struct redisCommand *found;

    found = dictFetchValue(server.commands, name);
    return found;
}

/* Resolve 'name' against the current command table first and, when that
 * fails, against the table holding the original command names, which is not
 * affected by redis.conf rename-command statements.
 *
 * Functions rewriting the argument vector, such as
 * rewriteClientCommandVector(), rely on this to set client->cmd correctly
 * even if the command was renamed. */
struct redisCommand *lookupCommandOrOriginal(sds name) {
    struct redisCommand *hit = dictFetchValue(server.commands, name);

    if (hit) return hit;
    return dictFetchValue(server.orig_commands,name);
}

/* Same as lookupCommand() but taking a plain C string: a temporary sds key
 * is built for the lookup and released before returning. */
struct redisCommand *lookupCommandByCString(char *s) {
    sds key;
    struct redisCommand *found;

    key = sdsnew(s);
    found = dictFetchValue(server.commands, key);
    sdsfree(key);

    return found;
}


/* Call() is the core of Redis execution of a command.
 *
 * It runs c->cmd->proc(c), measures how long it took and how much the
 * per-event-loop dirty counter moved, and then takes care of MONITOR
 * feeding, slow log, per-command statistics and propagation.
 *
 * The following flags can be passed:
 * CMD_CALL_NONE        No flags.
 * CMD_CALL_SLOWLOG     Check command speed and log in the slow log if needed.
 * CMD_CALL_STATS       Populate command stats.
 * CMD_CALL_PROPAGATE_AOF   Append command to AOF if it modified the dataset
 *                          or if the client flags are forcing propagation.
 * CMD_CALL_PROPAGATE_REPL  Send command to slaves if it modified the dataset
 *                          or if the client flags are forcing propagation.
 * CMD_CALL_PROPAGATE   Alias for PROPAGATE_AOF|PROPAGATE_REPL.
 * CMD_CALL_FULL        Alias for SLOWLOG|STATS|PROPAGATE.
 *
 * The exact propagation behavior depends on the client flags.
 * Specifically:
 *
 * 1. If the client flags CLIENT_FORCE_AOF or CLIENT_FORCE_REPL are set
 *    and assuming the corresponding CMD_CALL_PROPAGATE_AOF/REPL is set
 *    in the call flags, then the command is propagated even if the
 *    dataset was not affected by the command.
 * 2. If the client flags CLIENT_PREVENT_REPL_PROP or CLIENT_PREVENT_AOF_PROP
 *    are set, the propagation into AOF or to slaves is not performed even
 *    if the command modified the dataset.
 *
 * Note that regardless of the client flags, if CMD_CALL_PROPAGATE_AOF
 * or CMD_CALL_PROPAGATE_REPL are not set, then respectively AOF or
 * slaves propagation will never occur.
 *
 * Client flags are modified by the implementation of a given command
 * using the following API:
 *
 * forceCommandPropagation(client *c, int flags);
 * preventCommandPropagation(client *c);
 * preventCommandAOF(client *c);
 * preventCommandReplication(client *c);
 *
 */
void call(client *c, int flags) {
    long long dirty, start, duration;
    /* Snapshot taken so the propagation bits can be restored on exit. */
    int client_old_flags = c->flags;

    /* Send the command to clients in MONITOR mode, only if the commands are
     * not generated from reading an AOF. */
    if (dlistLength(server.monitors) &&
        !server.loading &&
        !(c->cmd->flags & (CMD_SKIP_MONITOR|CMD_ADMIN)))
    {
        replicationFeedMonitors(c,server.monitors,c->db->id,c->argv,c->argc);
    }

    /* Initialization: clear the flags that must be set by the command on
     * demand, and initialize the array for additional commands propagation. */
    c->flags &= ~(CLIENT_FORCE_AOF|CLIENT_FORCE_REPL|CLIENT_PREVENT_PROP);
    redisOpArrayInit(&server.also_propagate);

    /* Call the command. 'dirty' ends up holding how much the dirty counter
     * of the client's event loop grew during the call (never negative),
     * 'duration' the elapsed time in microseconds. */
    dirty = c->vel->dirty;
    start = vr_usec_now();
    c->cmd->proc(c);
    duration = vr_usec_now()-start;
    dirty = c->vel->dirty-dirty;
    if (dirty < 0) dirty = 0;

    /* When EVAL is called loading the AOF we don't want commands called
     * from Lua to go into the slowlog or to populate statistics. */
    if (server.loading && c->flags & CLIENT_LUA)
        flags &= ~(CMD_CALL_SLOWLOG | CMD_CALL_STATS);

    /* If the caller is Lua, we want to force the EVAL caller to propagate
     * the script if the command flag or client flag are forcing the
     * propagation. */
    if (c->flags & CLIENT_LUA && server.lua_caller) {
        if (c->flags & CLIENT_FORCE_REPL)
            server.lua_caller->flags |= CLIENT_FORCE_REPL;
        if (c->flags & CLIENT_FORCE_AOF)
            server.lua_caller->flags |= CLIENT_FORCE_AOF;
    }

    /* Log the command into the Slow log if needed, and populate the
     * per-command statistics that we show in INFO commandstats.
     * EXEC itself is never slow-logged. The latency sampling below is
     * disabled in this code base. */
    if (flags & CMD_CALL_SLOWLOG && c->cmd->proc != execCommand) {
        //char *latency_event = (c->cmd->flags & CMD_FAST) ?
        //                      "fast-command" : "command";
        //latencyAddSampleIfNeeded(latency_event,duration/1000);
        slowlogPushEntryIfNeeded(c->vel,c->argv,c->argc,duration);
    }
    if (flags & CMD_CALL_STATS) {
        /* Statistics live in the per-event-loop table, indexed by the
         * position of the command in the command table (c->lastcmd->idx). */
        commandStats *cstats = darray_get(c->vel->cstable,c->lastcmd->idx);
        cstats->microseconds += duration;
        cstats->calls++;
    }

    /* Propagate the command into the AOF and replication link, unless both
     * AOF and replication propagation were prevented by the command. */
    if (flags & CMD_CALL_PROPAGATE &&
        (c->flags & CLIENT_PREVENT_PROP) != CLIENT_PREVENT_PROP)
    {
        int propagate_flags = PROPAGATE_NONE;

        /* Check if the command operated changes in the data set. If so
         * set for replication / AOF propagation. */
        if (dirty) propagate_flags |= (PROPAGATE_AOF|PROPAGATE_REPL);

        /* If the client forced AOF / replication of the command, set
         * the flags regardless of the command effects on the data set. */
        if (c->flags & CLIENT_FORCE_REPL) propagate_flags |= PROPAGATE_REPL;
        if (c->flags & CLIENT_FORCE_AOF) propagate_flags |= PROPAGATE_AOF;

        /* However prevent AOF / replication propagation if the command
         * implementation called preventCommandPropagation() or similar,
         * or if we don't have the call() flags to do so. */
        if (c->flags & CLIENT_PREVENT_REPL_PROP ||
            !(flags & CMD_CALL_PROPAGATE_REPL))
                propagate_flags &= ~PROPAGATE_REPL;
        if (c->flags & CLIENT_PREVENT_AOF_PROP ||
            !(flags & CMD_CALL_PROPAGATE_AOF))
                propagate_flags &= ~PROPAGATE_AOF;

        /* Call propagate() only if at least one of AOF / replication
         * propagation is needed. */
        if (propagate_flags != PROPAGATE_NONE)
            propagate(c->cmd,c->db->id,c->argv,c->argc,propagate_flags);
    }

    /* Restore the old replication flags, since call() can be executed
     * recursively. */
    c->flags &= ~(CLIENT_FORCE_AOF|CLIENT_FORCE_REPL|CLIENT_PREVENT_PROP);
    c->flags |= client_old_flags &
        (CLIENT_FORCE_AOF|CLIENT_FORCE_REPL|CLIENT_PREVENT_PROP);

    /* Handle the alsoPropagate() API to handle commands that want to propagate
     * multiple separated commands. Note that alsoPropagate() is not affected
     * by CLIENT_PREVENT_PROP flag. */
    if (server.also_propagate.numops) {
        int j;
        redisOp *rop;

        if (flags & CMD_CALL_PROPAGATE) {
            for (j = 0; j < server.also_propagate.numops; j++) {
                rop = &server.also_propagate.ops[j];
                int target = rop->target;
                /* Whatever the command wish is, we honor the call() flags. */
                if (!(flags&CMD_CALL_PROPAGATE_AOF)) target &= ~PROPAGATE_AOF;
                if (!(flags&CMD_CALL_PROPAGATE_REPL)) target &= ~PROPAGATE_REPL;
                if (target)
                    propagate(rop->cmd,rop->dbid,rop->argv,rop->argc,target);
            }
        }
        /* The queued operations are released even when not propagated. */
        redisOpArrayFree(&server.also_propagate);
    }
    /* Count the executed command in the statistics of the event loop. */
    update_stats_add(c->vel->stats, numcommands, 1);
}

/* Validate and dispatch a fully parsed command.
 *
 * When this function is called a whole command has already been read and
 * its arguments are in the client argv/argc fields. The function runs a
 * fixed sequence of checks (QUIT, command lookup and arity, authentication,
 * admin rights, maxmemory, persistence errors, replication constraints,
 * Pub/Sub context, loading, slow script) and finally either queues the
 * command inside a MULTI block or executes it through call().
 *
 * Most rejections add an error reply and return VR_OK; where the original
 * Redis logic does so, the open transaction (if any) is flagged through
 * flagTransaction().
 *
 * Returns VR_OK when the caller may keep operating on the client. Returns
 * VR_ERROR after QUIT (the client is flagged CLIENT_CLOSE_AFTER_REPLY) and
 * when the current client turned out to be gone after freeMemoryIfNeeded(). */
int processCommand(client *c) {
    long long maxmemory;

    /* The QUIT command is handled separately. Normal command procs will
     * go through checking for replication and QUIT will cause trouble
     * when FORCE_REPLICATION is enabled and would be implemented in
     * a regular command proc. */
    if (!strcasecmp(c->argv[0]->ptr,"quit")) {
        addReply(c,shared.ok);
        c->flags |= CLIENT_CLOSE_AFTER_REPLY;
        return VR_ERROR;
    }

    /* Now lookup the command and check ASAP about trivial error conditions
     * such as wrong arity, bad command name and so forth. A positive arity
     * is an exact argument count, a negative one is a minimum. */
    c->cmd = c->lastcmd = lookupCommand(c->argv[0]->ptr);
    if (!c->cmd) {
        flagTransaction(c);
        addReplyErrorFormat(c,"unknown command '%s'",
            (char*)c->argv[0]->ptr);
        return VR_OK;
    } else if ((c->cmd->arity > 0 && c->cmd->arity != c->argc) ||
               (c->argc < -c->cmd->arity)) {
        flagTransaction(c);
        addReplyErrorFormat(c,"wrong number of arguments for '%s' command",
            c->cmd->name);
        return VR_OK;
    }

    /* Check if the user is authenticated. AUTH and ADMIN are always let
     * through so that the client can actually authenticate. */
    if (c->vel->cc.requirepass && !c->authenticated &&
        c->cmd->proc != authCommand && c->cmd->proc != adminCommand)
    {
        flagTransaction(c);
        addReply(c,shared.noautherr);
        return VR_OK;
    }

    /* Commands marked 'needadmin' additionally require an authentication
     * level of at least 2 when an admin password is configured. */
    if (c->cmd->needadmin && c->vel->cc.adminpass &&
        c->authenticated < 2 && c->cmd->proc != adminCommand)
    {
        flagTransaction(c);
        addReply(c,shared.noadminerr);
        return VR_OK;
    }

    /* Handle the maxmemory directive.
     *
     * First we try to free some memory if possible (if there are volatile
     * keys in the dataset). If there are not the only thing we can do
     * is returning an error. */
    maxmemory = c->vel->cc.maxmemory;
    if (maxmemory) {
        int retval = freeMemoryIfNeeded(c->vel);
        /* freeMemoryIfNeeded may flush slave output buffers. This may result
         * into a slave, that may be the active client, to be freed. */
        if (c->vel->current_client == NULL) return VR_ERROR;

        /* It was impossible to free enough memory, and the command the client
         * is trying to execute is denied during OOM conditions? Error. */
        if ((c->cmd->flags & CMD_DENYOOM) && retval == VR_ERROR) {
            flagTransaction(c);
            addReply(c, shared.oomerr);
            return VR_OK;
        }
    }

    /* Don't accept write commands if there are problems persisting on disk
     * and if this is a master instance. */
    if (((server.stop_writes_on_bgsave_err &&
          server.saveparamslen > 0 &&
          server.lastbgsave_status == VR_ERROR) ||
          server.aof_last_write_status == VR_ERROR) &&
        repl.masterhost == NULL &&
        (c->cmd->flags & CMD_WRITE ||
         c->cmd->proc == pingCommand))
    {
        flagTransaction(c);
        if (server.aof_last_write_status == VR_OK)
            addReply(c, shared.bgsaveerr);
        else
            addReplySds(c,
                sdscatprintf(sdsempty(),
                "-MISCONF Errors writing to the AOF file: %s\r\n",
                strerror(server.aof_last_write_errno)));
        return VR_OK;
    }

    /* Don't accept write commands if there are not enough good slaves and
     * user configured the min-slaves-to-write option. */
    if (repl.masterhost == NULL &&
        repl.repl_min_slaves_to_write &&
        repl.repl_min_slaves_max_lag &&
        c->cmd->flags & CMD_WRITE &&
        repl.repl_good_slaves_count < repl.repl_min_slaves_to_write)
    {
        flagTransaction(c);
        addReply(c, shared.noreplicaserr);
        return VR_OK;
    }

    /* Don't accept write commands if this is a read only slave. But
     * accept write commands if this is our master. */
    if (repl.masterhost && repl.repl_slave_ro &&
        !(c->flags & CLIENT_MASTER) &&
        c->cmd->flags & CMD_WRITE)
    {
        addReply(c, shared.roslaveerr);
        return VR_OK;
    }

    /* Only allow SUBSCRIBE and UNSUBSCRIBE in the context of Pub/Sub */
    if (c->flags & CLIENT_PUBSUB &&
        c->cmd->proc != pingCommand &&
        c->cmd->proc != subscribeCommand &&
        c->cmd->proc != unsubscribeCommand &&
        c->cmd->proc != psubscribeCommand &&
        c->cmd->proc != punsubscribeCommand) {
        addReplyError(c,"only (P)SUBSCRIBE / (P)UNSUBSCRIBE / PING / QUIT allowed in this context");
        return VR_OK;
    }

    /* Only allow commands flagged CMD_STALE when slave-serve-stale-data is
     * no and we are a slave with a broken link with master. */
    if (repl.masterhost && repl.repl_state != REPL_STATE_CONNECTED &&
        repl.repl_serve_stale_data == 0 &&
        !(c->cmd->flags & CMD_STALE))
    {
        flagTransaction(c);
        addReply(c, shared.masterdownerr);
        return VR_OK;
    }

    /* Loading DB? Return an error if the command has not the
     * CMD_LOADING flag. */
    if (server.loading && !(c->cmd->flags & CMD_LOADING)) {
        addReply(c, shared.loadingerr);
        return VR_OK;
    }

    /* Lua script too slow? Only allow a limited number of commands.
     *
     * The first byte of argv[1] comes straight from the client, so it is
     * converted to unsigned char before being handed to tolower(): passing
     * a negative char value to the <ctype.h> functions is undefined. */
    if (server.lua_timedout &&
          c->cmd->proc != authCommand &&
          c->cmd->proc != replconfCommand &&
        !(c->cmd->proc == shutdownCommand &&
          c->argc == 2 &&
          tolower((unsigned char)((char*)c->argv[1]->ptr)[0]) == 'n') &&
        !(c->cmd->proc == scriptCommand &&
          c->argc == 2 &&
          tolower((unsigned char)((char*)c->argv[1]->ptr)[0]) == 'k'))
    {
        flagTransaction(c);
        addReply(c, shared.slowscripterr);
        return VR_OK;
    }

    /* Exec the command: inside MULTI everything except EXEC, DISCARD, MULTI
     * and WATCH is queued instead of being executed. */
    if (c->flags & CLIENT_MULTI &&
        c->cmd->proc != execCommand && c->cmd->proc != discardCommand &&
        c->cmd->proc != multiCommand && c->cmd->proc != watchCommand)
    {
        queueMultiCommand(c);
        addReply(c,shared.queued);
    } else {
        call(c,CMD_CALL_FULL);
        c->woff = repl.master_repl_offset;
        if (dlistLength(server.ready_keys))
            handleClientsBlockedOnLists();
    }

    return VR_OK;
}

/* ========================== Redis OP Array API ============================ */

/* Reset 'oa' to the empty state: no operations and no backing storage.
 * Nothing is released here, the previous content is simply forgotten. */
void redisOpArrayInit(redisOpArray *oa) {
    oa->numops = 0;
    oa->ops = NULL;
}

/* Append one operation to 'oa', growing the backing storage by one slot.
 *
 * The 'argv' pointer is stored as is (not copied). Returns the number of
 * operations held by the array after the append. */
int redisOpArrayAppend(redisOpArray *oa, struct redisCommand *cmd, int dbid,
                       robj **argv, int argc, int target)
{
    size_t wanted = (size_t)oa->numops + 1;
    redisOp *slot;

    oa->ops = drealloc(oa->ops, sizeof(redisOp) * wanted);

    /* The new operation goes into the last, freshly added slot. */
    slot = &oa->ops[oa->numops];
    slot->argv = argv;
    slot->argc = argc;
    slot->dbid = dbid;
    slot->target = target;
    slot->cmd = cmd;

    return ++oa->numops;
}

/* Release every operation stored in 'oa' and the array storage itself.
 *
 * For each operation the reference count of every argument is decremented
 * and the argv vector is freed, so the array owns the vectors handed to
 * redisOpArrayAppend(). On return 'oa' is back in the empty state
 * (numops == 0, ops == NULL), so it can be appended to again without going
 * through redisOpArrayInit() and without reallocating freed memory. */
void redisOpArrayFree(redisOpArray *oa) {
    while(oa->numops) {
        int j;
        redisOp *op;

        oa->numops--;
        op = oa->ops+oa->numops;
        for (j = 0; j < op->argc; j++)
            decrRefCount(op->argv[j]);
        dfree(op->argv);
    }
    dfree(oa->ops);
    /* Do not leave a dangling pointer behind: redisOpArrayAppend() passes
     * oa->ops to drealloc(). */
    oa->ops = NULL;
}

/* Propagate the specified command (in the context of the specified database
 * id) to the AOF and / or to the slaves.
 *
 * 'flags' is a bitwise OR of:
 * + PROPAGATE_NONE (no propagation of command at all)
 * + PROPAGATE_AOF  (feed the AOF, only if the AOF is not off)
 * + PROPAGATE_REPL (feed the replication link)
 *
 * This should not be used inside commands implementation. Use instead
 * alsoPropagate(), preventCommandPropagation(), forceCommandPropagation().
 */
void propagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
               int flags)
{
    int to_aof = (flags & PROPAGATE_AOF) && server.aof_state != AOF_OFF;
    int to_slaves = (flags & PROPAGATE_REPL) != 0;

    if (to_aof) {
        feedAppendOnlyFile(cmd,dbid,argv,argc);
    }
    if (to_slaves) {
        replicationFeedSlaves(repl.slaves,dbid,argv,argc);
    }
}

/* Used inside commands to schedule the propagation of additional commands
 * after the current command is propagated to AOF / Replication.
 *
 * 'cmd' must be a pointer to the Redis command to replicate, 'dbid' is the
 * database ID the command should be propagated into. The arguments of the
 * command to propagate are passed as an array of 'argc' object pointers in
 * the 'argv' vector.
 *
 * The function does not keep a reference to the passed 'argv' vector nor to
 * the objects in it: a new vector is allocated and filled with the result
 * of dupStringObjectUnconstant() for every argument, and that vector is
 * what gets queued in server.also_propagate. The caller remains responsible
 * for whatever it passed in. Nothing is queued while the server is loading. */
void alsoPropagate(struct redisCommand *cmd, int dbid, robj **argv, int argc,
                   int target)
{
    robj **queued;
    int i = 0;

    /* No propagation during loading. */
    if (server.loading) {
        return;
    }

    queued = dalloc(sizeof(robj*)*(size_t)argc);
    while (i < argc) {
        queued[i] = dupStringObjectUnconstant(argv[i]);
        i++;
    }
    redisOpArrayAppend(&server.also_propagate,cmd,dbid,queued,argc,target);
}

/* Can be called inside a command implementation to force the propagation
 * of the command being executed: PROPAGATE_AOF in 'flags' sets
 * CLIENT_FORCE_AOF on the client, PROPAGATE_REPL sets CLIENT_FORCE_REPL. */
void forceCommandPropagation(client *c, int flags) {
    if ((flags & PROPAGATE_REPL) != 0) {
        c->flags |= CLIENT_FORCE_REPL;
    }
    if ((flags & PROPAGATE_AOF) != 0) {
        c->flags |= CLIENT_FORCE_AOF;
    }
}

/* Mark the client with CLIENT_PREVENT_PROP so that the command being
 * executed is not propagated at all. Commands can then propagate exactly
 * what they want through the alsoPropagate() API. */
void preventCommandPropagation(client *c) {
    c->flags = c->flags | CLIENT_PREVENT_PROP;
}

/* Like preventCommandPropagation(), but only for the AOF: sets
 * CLIENT_PREVENT_AOF_PROP on the client. */
void preventCommandAOF(client *c) {
    c->flags = c->flags | CLIENT_PREVENT_AOF_PROP;
}

/* Like preventCommandPropagation(), but only for replication: sets
 * CLIENT_PREVENT_REPL_PROP on the client. */
void preventCommandReplication(client *c) {
    c->flags = c->flags | CLIENT_PREVENT_REPL_PROP;
}

/* Helper for addReplyCommand(): when 'cmd' has the flag bit(s) 'f' set,
 * emit 'reply' as a status reply and return 1; otherwise emit nothing and
 * return 0. The return value lets the caller count the emitted flags. */
static int addReplyCommandFlag(client *c, struct redisCommand *cmd, int f, char *reply) {
    if ((cmd->flags & f) == 0) {
        return 0;
    }

    addReplyStatus(c, reply);
    return 1;
}

/* Output the representation of a Redis command. Used by the COMMAND command.
 *
 * A NULL 'cmd' is reported as a null bulk. Otherwise the reply is a six
 * element multi bulk: name, arity, list of flag names, first key, last key
 * and key step. The flag list length is not known in advance, so it is
 * emitted as a deferred length and fixed up once the flags were counted. */
static void addReplyCommand(client *c, struct redisCommand *cmd) {
    /* Flag bits and the names they are reported with, in output order. */
    static const struct {
        int bit;
        char *label;
    } flag_labels[] = {
        { CMD_WRITE,           "write" },
        { CMD_READONLY,        "readonly" },
        { CMD_DENYOOM,         "denyoom" },
        { CMD_ADMIN,           "admin" },
        { CMD_PUBSUB,          "pubsub" },
        { CMD_NOSCRIPT,        "noscript" },
        { CMD_RANDOM,          "random" },
        { CMD_SORT_FOR_SCRIPT, "sort_for_script" },
        { CMD_LOADING,         "loading" },
        { CMD_STALE,           "stale" },
        { CMD_SKIP_MONITOR,    "skip_monitor" },
        { CMD_ASKING,          "asking" },
        { CMD_FAST,            "fast" }
    };
    size_t i;
    int emitted = 0;
    void *deferred;

    if (cmd == NULL) {
        addReply(c, shared.nullbulk);
        return;
    }

    /* We are adding: command name, arg count, flags, first, last, offset */
    addReplyMultiBulkLen(c, 6);
    addReplyBulkCString(c, cmd->name);
    addReplyLongLong(c, cmd->arity);

    deferred = addDeferredMultiBulkLength(c);
    for (i = 0; i < sizeof(flag_labels)/sizeof(flag_labels[0]); i++) {
        emitted += addReplyCommandFlag(c, cmd, flag_labels[i].bit,
                                       flag_labels[i].label);
    }
    /* Commands with a key-extraction callback are additionally tagged. */
    if (cmd->getkeys_proc) {
        addReplyStatus(c, "movablekeys");
        emitted++;
    }
    setDeferredMultiBulkLength(c, deferred, emitted);

    addReplyLongLong(c, cmd->firstkey);
    addReplyLongLong(c, cmd->lastkey);
    addReplyLongLong(c, cmd->keystep);
}

/* COMMAND <subcommand> <args>
 *
 * Supported forms:
 *   COMMAND                      describe every command in server.commands
 *   COMMAND INFO [name ...]      describe the named commands (null bulk for
 *                                names that are not found)
 *   COMMAND COUNT                number of commands in server.commands
 *   COMMAND GETKEYS cmd [arg...] key arguments of the given command line
 *   COMMAND STATS                per-command call statistics summed over
 *                                the worker threads
 *
 * STATS is a multi step command: on every step the statistics of the
 * current worker (c->vel->cstable) are added to an accumulator table kept
 * in c->cache, and c->taridx is set to the next worker. The reply is only
 * produced on the step where c->steps reaches the number of workers minus
 * one. c->steps is not modified here except for being reset at the end.
 * NOTE(review): it is presumably advanced by the CLIENT_JUMP machinery
 * when the client is moved between workers; confirm against that code. */
void commandCommand(client *c) {
    if (c->argc == 1) {
        dictIterator *di;
        dictEntry *de;

        addReplyMultiBulkLen(c, dictSize(server.commands));
        di = dictGetIterator(server.commands);
        while ((de = dictNext(di)) != NULL) {
            addReplyCommand(c, dictGetVal(de));
        }
        dictReleaseIterator(di);
    } else if (!strcasecmp(c->argv[1]->ptr, "info")) {
        int i;
        addReplyMultiBulkLen(c, c->argc-2);
        for (i = 2; i < c->argc; i++) {
            addReplyCommand(c, dictFetchValue(server.commands, c->argv[i]->ptr));
        }
    } else if (!strcasecmp(c->argv[1]->ptr, "count") && c->argc == 2) {
        addReplyLongLong(c, dictSize(server.commands));
    } else if (!strcasecmp(c->argv[1]->ptr,"getkeys") && c->argc >= 3) {
        struct redisCommand *cmd = lookupCommand(c->argv[2]->ptr);
        int *keys, numkeys, j;

        /* The command line to inspect starts at argv[2], hence the -2 when
         * checking the arity and the +2 when mapping key indexes back. */
        if (!cmd) {
            addReplyErrorFormat(c,"Invalid command specified");
            return;
        } else if ((cmd->arity > 0 && cmd->arity != c->argc-2) ||
                   ((c->argc-2) < -cmd->arity))
        {
            addReplyError(c,"Invalid number of arguments specified for command");
            return;
        }

        keys = getKeysFromCommand(cmd,c->argv+2,c->argc-2,&numkeys);
        addReplyMultiBulkLen(c,numkeys);
        for (j = 0; j < numkeys; j++) addReplyBulk(c,c->argv[keys[j]+2]);
        getKeysFreeResult(keys);
    } else if (!strcasecmp(c->argv[1]->ptr, "stats") && c->argc == 2) {
        int j;
        struct darray *cstableall;
        struct darray *cstable = c->vel->cstable;
        commandStats *cstats, *cstatsall;

        if (c->steps == 0) {
            /* First step: create the accumulator. Bail out before touching
             * any client state if it cannot be allocated. */
            cstableall = commandStatsTableCreate();
            if (cstableall == NULL) {
                addReplyError(c,"Failed to allocate the command stats table");
                return;
            }
            c->flags |= CLIENT_JUMP;
            c->taridx = worker_get_next_idx(c->curidx);
            c->cache = cstableall;
        } else {
            cstableall = c->cache;
            c->taridx = worker_get_next_idx(c->curidx);
        }

        /* Add the statistics of the current worker to the accumulator.
         * Both tables are indexed by command index. */
        for (j = 0; j < darray_n(cstable); j ++) {
            cstats = darray_get(cstable, j);
            if (!cstats->calls) continue;

            cstatsall = darray_get(cstableall, j);
            cstatsall->microseconds += cstats->microseconds;
            cstatsall->calls += cstats->calls;
        }

        if (c->steps >= (darray_n(&workers) - 1)) {
            sds command_stats_info;
            void *replylen_node;
            long replylen = 0;

            /* Last step: leave the multi step mode and send the reply. */
            c->steps = 0;
            c->taridx = -1;
            c->cache = NULL;
            c->flags &= ~CLIENT_JUMP;

            replylen_node = addDeferredMultiBulkLength(c);
            for (j = 0; j < darray_n(cstableall); j ++) {
                cstatsall = darray_get(cstableall, j);
                /* Never called commands are omitted; this also keeps the
                 * division below away from zero. */
                if (!cstatsall->calls) continue;

                command_stats_info = sdscatprintf(sdsempty(),
                    "%s:calls=%lld,usec=%lld,usec_per_call=%.2f",
                    cstatsall->name, cstatsall->calls, cstatsall->microseconds,
                    (float)cstatsall->microseconds/cstatsall->calls);
                addReplyBulkSds(c,command_stats_info);
                replylen ++;
            }

            setDeferredMultiBulkLength(c,replylen_node,replylen);

            commandStatsTableDestroy(cstableall);
        }
    } else {
        addReplyError(c, "Unknown subcommand or wrong number of arguments.");
        return;
    }
}

struct darray *
commandStatsTableCreate(void)
{
    int j;
    commandStats *cstats;
    struct darray *cstatstable;
    int numcommands = sizeof(redisCommandTable)/sizeof(struct redisCommand);
    

    cstatstable = darray_create(numcommands,sizeof(commandStats));
    if (cstatstable == NULL) return NULL;
    for (j = 0; j < numcommands; j ++) {
        struct redisCommand *c = redisCommandTable+j;
        cstats = darray_push(cstatstable);
        cstats->name = c->name;
        cstats->microseconds = 0;
        cstats->calls = 0;
        ASSERT(j == c->idx);
    }

    return cstatstable;
}

/* Release a table created by commandStatsTableCreate(). Passing NULL is
 * allowed and does nothing, which pairs with the create function being
 * able to return NULL. */
void
commandStatsTableDestroy(struct darray *cstatstable)
{
    if (cstatstable == NULL) {
        return;
    }

    /* The entries own no resources (names point into the command table),
     * so the array is simply marked empty before being destroyed.
     * NOTE(review): presumably darray_destroy() expects an empty array;
     * confirm against darray.c. */
    cstatstable->nelem = 0;
    darray_destroy(cstatstable);
}


================================================
FILE: src/vr_command.h
================================================
#ifndef _VR_COMMAND_H_
#define _VR_COMMAND_H_

/* Command flags. Each flag is a distinct bit of redisCommand.flags, which is
 * obtained from the one-character-per-flag 'sflags' string of the command
 * table entry; the character is quoted next to each flag. Please check the
 * command table for more information about the meaning of every flag. */
#define CMD_WRITE 1                   /* "w" flag */
#define CMD_READONLY 2                /* "r" flag */
#define CMD_DENYOOM 4                 /* "m" flag */
#define CMD_NOT_USED_1 8              /* no longer used flag */
#define CMD_ADMIN 16                  /* "a" flag */
#define CMD_PUBSUB 32                 /* "p" flag */
#define CMD_NOSCRIPT  64              /* "s" flag */
#define CMD_RANDOM 128                /* "R" flag */
#define CMD_SORT_FOR_SCRIPT 256       /* "S" flag */
#define CMD_LOADING 512               /* "l" flag */
#define CMD_STALE 1024                /* "t" flag */
#define CMD_SKIP_MONITOR 2048         /* "M" flag */
#define CMD_ASKING 4096               /* "k" flag */
#define CMD_FAST 8192                 /* "F" flag */

/* Command call flags, see call() function. They are a bit mask passed as
 * the 'flags' argument of call(); processCommand() uses CMD_CALL_FULL. */
#define CMD_CALL_NONE 0
#define CMD_CALL_SLOWLOG (1<<0)          /* presumably: log slow executions - TODO confirm in call() */
#define CMD_CALL_STATS (1<<1)            /* presumably: update command stats - TODO confirm in call() */
#define CMD_CALL_PROPAGATE_AOF (1<<2)    /* call() may propagate to the AOF */
#define CMD_CALL_PROPAGATE_REPL (1<<3)   /* call() may propagate to the replication link */
#define CMD_CALL_PROPAGATE (CMD_CALL_PROPAGATE_AOF|CMD_CALL_PROPAGATE_REPL)
#define CMD_CALL_FULL (CMD_CALL_SLOWLOG | CMD_CALL_STATS | CMD_CALL_PROPAGATE)

/* Command propagation flags, see propagate() function. AOF and REPL can be
 * ORed together. */
#define PROPAGATE_NONE 0
#define PROPAGATE_AOF 1   /* Feed the AOF (only when the AOF is not off). */
#define PROPAGATE_REPL 2  /* Feed the slaves. */

/* SHUTDOWN flags */
#define SHUTDOWN_NOFLAGS 0      /* No flags. */
#define SHUTDOWN_SAVE 1         /* Force SAVE on SHUTDOWN even if no save
                                   points are configured. */
#define SHUTDOWN_NOSAVE 2       /* Don't SAVE on SHUTDOWN. */

/* Implementation of a command: receives the client issuing it. */
typedef void redisCommandProc(struct client *c);
/* Key-extraction callback of a command. NOTE(review): presumably returns
 * the argv indexes of the key arguments and stores their count in
 * '*numkeys', like getKeysFromCommand() - confirm against the callers. */
typedef int *redisGetKeysProc(struct redisCommand *cmd, robj **argv, int argc, int *numkeys);
/* Description of one command, i.e. one entry of the command table. */
struct redisCommand {
    char *name;   /* Command name, as used in replies and statistics. */
    redisCommandProc *proc; /* Function implementing the command. */
    int arity;    /* Positive: exact number of arguments (command name
                     included). Negative: at least -arity arguments. */
    char *sflags; /* Flags as string representation, one char per flag. */
    int flags;    /* The actual flags, obtained from the 'sflags' field. */
    /* Use a function to determine keys arguments in a command line.
     * Used for Redis Cluster redirect. When set, COMMAND reports the
     * command with the additional "movablekeys" flag. */
    redisGetKeysProc *getkeys_proc;
    /* What keys should be loaded in background when calling this command? */
    int firstkey; /* The first argument that's a key (0 = no keys) */
    int lastkey;  /* The last argument that's a key */
    int keystep;  /* The step between first and last key */
    int idx;      /* Position of the command in redisCommandTable; also the
                     index of its entry in the command stats tables. */
    int needadmin; /* Non zero: when an admin password is configured the
                      command is refused unless the client authentication
                      level is at least 2 (see processCommand()). */
};

typedef struct commandStats {
    char *name;
    long long microseconds;
    long long calls;
}commandStats;

/* The redisOp structure defines a Redis Operation, that is an instance of
 * a command with an argument vector, database ID, propagation target
 * (PROPAGATE_*), and command pointer.
 *
 * Currently only used to additionally propagate more commands to AOF/Replication
 * after the propagation of the executed command. */
typedef struct redisOp {
    robj **argv;              /* Argument vector; its objects and the vector
                                 itself are released by redisOpArrayFree(). */
    int argc, dbid, target;   /* Number of arguments, database ID and
                                 PROPAGATE_* target mask. */
    struct redisCommand *cmd; /* Command the operation is an instance of. */
} redisOp;

/* Defines an array of Redis operations. There is an API to add to this
 * structure in an easy way.
 *
 * redisOpArrayInit();
 * redisOpArrayAppend();
 * redisOpArrayFree();
 */
typedef struct redisOpArray {
    redisOp *ops; /* Storage of the operations, grown by one slot on every
                     append; NULL after redisOpArrayInit(). */
    int numops;   /* Number of valid entries in 'ops'. */
} redisOpArray;

/* Dictionary type of the command table dictionary. */
extern dictType commandTableDictType;

/* Command table setup. */
void populateCommandTable(void);
int populateCommandsNeedAdminpass(void);

/* Command lookup by name. */
struct redisCommand *lookupCommand(sds name);
struct redisCommand *lookupCommandOrOriginal(sds name);
struct redisCommand *lookupCommandByCString(char *s);

/* Command execution: call() runs c->cmd with the CMD_CALL_* flags,
 * processCommand() validates a parsed command and then executes or queues
 * it. */
void call(struct client *c, int flags);
int processCommand(struct client *c);

/* Array of operations queued for additional propagation. */
void redisOpArrayInit(redisOpArray *oa);
int redisOpArrayAppend(redisOpArray *oa, struct redisCommand *cmd, int dbid, robj **argv, int argc, int target);
void redisOpArrayFree(redisOpArray *oa);

/* Propagation to AOF / replication and the per-client knobs controlling it. */
void propagate(struct redisCommand *cmd, int dbid, robj **argv, int argc, int flags);
void alsoPropagate(struct redisCommand *cmd, int dbid, robj **argv, int argc, int target);
void forceCommandPropagation(struct client *c, int flags);
void preventCommandPropagation(struct client *c);
void preventCommandAOF(struct client *c);
void preventCommandReplication(struct client *c);

/* Implementation of the COMMAND command. */
void commandCommand(struct client *c);

/* Per-command statistics tables, see commandStats. */
struct darray *commandStatsTableCreate(void);
void commandStatsTableDestroy(struct darray *cstatstable);

#endif


================================================
FILE: src/vr_conf.c
================================================
#include <fcntl.h>

#include <vr_core.h>

/* Function mapping an enumeration value to its string representation. */
typedef const char *(*configEnumGetStrFun)(int type);

/* Tokens of the configuration file syntax. */
#define CONF_TOKEN_ORGANIZATION_START   "["
#define CONF_TOKEN_ORGANIZATION_END     "]"
#define CONF_TOKEN_KEY_VALUE_BETWEEN    ":"
#define CONF_TOKEN_ARRAY_START          "-"

/* Names of the organizations (sections). "COMMAN" is a historical spelling
 * of "COMMON" kept in the identifier. */
#define CONF_ORGANIZATION_NAME_COMMAN   "common"
#define CONF_ORGANIZATION_NAME_SERVER   "server"

/* Accepted values of yes/no options, compared case insensitively by
 * conf_set_yesorno(). */
#define CONF_VALUE_YES                  "yes"
#define CONF_VALUE_NO                   "no"

/* NOTE(review): presumably the maximum length of a configuration file
 * line - confirm against the parser. */
#define CONF_MAX_LINE                   1024

/* Default values. */
#define CONF_TAG_DEFAULT_TYPE           GROUP_TYPE_SINGLE
#define CONF_TAG_DEFAULT_HASH           HASH_FNV1_64
#define CONF_TAG_DEFAULT_HASH_TAG       NULL
#define CONF_TAG_DEFAULT_DISTRIBUTION   "ketama"
#define CONF_TAG_DEFAULT_REDIS_AUTH     NULL
#define CONF_TAG_DEFAULT_REDIS_DB       0
#define CONF_TAG_DEFAULT_TIMEOUT        300
#define CONF_TAG_DEFAULT_SERVERS        "127.0.0.1:6379"
#define CONF_TAG_DEFAULT_LISTEN         "127.0.0.1:6380"
#define CONF_TAG_DEFAULT_MAXMEMORY      1073741824   // 1 GiB (2^30 bytes)
#define CONF_TAG_DEFAULT_THREADS        sysconf(_SC_NPROCESSORS_ONLN)
#define CONF_TAG_DEFAULT_NOREPLY        "false"
#define CONF_TAG_DEFAULT_RDB_DISKLESS   "false"

/* NULL terminated name tables generated with the X-macro technique:
 * DEFINE_ACTION is defined to stringify the second argument of every
 * element of the *_CODEC list, then undefined again. */

/* Names of the hash functions listed by HASH_CODEC. */
#define DEFINE_ACTION(_hash, _name) (char*)(#_name),
static char* hash_strings[] = {
    HASH_CODEC( DEFINE_ACTION )
    NULL
};
#undef DEFINE_ACTION

/* Names of the distributions listed by DIST_CODEC. */
#define DEFINE_ACTION(_dist, _name) (char*)(#_name),
static char* dist_strings[] = {
    DIST_CODEC( DEFINE_ACTION )
    NULL
};
#undef DEFINE_ACTION

/* Names of the eviction policies listed by EVICTPOLICY_CODEC. The index of
 * a name in this table is the value conf_set_maxmemory_policy() stores as
 * the configured policy. */
#define DEFINE_ACTION(_policy, _name) (char*)(#_name),
static char* evictpolicy_strings[] = {
    EVICTPOLICY_CODEC( DEFINE_ACTION )
    NULL
};
#undef DEFINE_ACTION

/* Table of the options of the "server" organization.
 *
 * Every entry lists, in order: the option name, the CONF_FIELD_TYPE_* of
 * the backing field, an integer flag, the setter, the getter, and the
 * offset of the backing field inside conf_server (setters and getters add
 * this offset to the object pointer they receive).
 * NOTE(review): the meaning of the 0/1 flag is not visible here - see the
 * conf_option definition.
 *
 * The table ends with an entry whose name is NULL.
 * NOTE(review): that terminator passes NULL for the type column as well;
 * if that member is an integer or enum a plain 0 would be cleaner - TODO
 * confirm against conf_option. */
static conf_option conf_server_options[] = {
    { (char *)CONFIG_SOPN_DATABASES,
      CONF_FIELD_TYPE_INT, 1,
      conf_set_int_non_zero, conf_get_int,
      offsetof(conf_server, databases) },
    { (char *)CONFIG_SOPN_IDPDATABASE,
      CONF_FIELD_TYPE_INT, 1,
      conf_set_int_non_zero, conf_get_int,
      offsetof(conf_server, internal_dbs_per_databases) },
    { (char *)CONFIG_SOPN_MAXMEMORY,
      CONF_FIELD_TYPE_LONGLONG, 0,
      conf_set_maxmemory, conf_get_longlong,
      offsetof(conf_server, maxmemory) },
    { (char *)CONFIG_SOPN_MAXMEMORYP,
      CONF_FIELD_TYPE_INT, 0,
      conf_set_maxmemory_policy, conf_get_int,
      offsetof(conf_server, maxmemory_policy) },
    { (char *)CONFIG_SOPN_MAXMEMORYS,
      CONF_FIELD_TYPE_INT, 0,
      conf_set_int_non_zero, conf_get_int,
      offsetof(conf_server, maxmemory_samples) },
    { (char *)CONFIG_SOPN_MTCLIMIT,
      CONF_FIELD_TYPE_LONGLONG, 0,
      conf_set_longlong, conf_get_longlong,
      offsetof(conf_server, max_time_complexity_limit) },
    { (char *)CONFIG_SOPN_BIND,
      CONF_FIELD_TYPE_ARRAYSDS, 1,
      conf_set_array_sds, conf_get_array_sds,
      offsetof(conf_server, binds) },
    { (char *)CONFIG_SOPN_PORT,
      CONF_FIELD_TYPE_INT, 1,
      conf_set_int, conf_get_int,
      offsetof(conf_server, port) },
    { (char *)CONFIG_SOPN_THREADS,
      CONF_FIELD_TYPE_INT, 1,
      conf_set_int, conf_get_int,
      offsetof(conf_server, threads) },
    { (char *)CONFIG_SOPN_MAXCLIENTS,
      CONF_FIELD_TYPE_INT, 0,
      conf_set_int_non_zero, conf_get_int,
      offsetof(conf_server, maxclients) },
    { (char *)CONFIG_SOPN_SLOWLOGLST,
      CONF_FIELD_TYPE_LONGLONG, 0,
      conf_set_longlong, conf_get_longlong,
      offsetof(conf_server, slowlog_log_slower_than) },
    { (char *)CONFIG_SOPN_SLOWLOGML,
      CONF_FIELD_TYPE_INT, 0,
      conf_set_int, conf_get_int,
      offsetof(conf_server, slowlog_max_len) },
    { (char *)CONFIG_SOPN_REQUIREPASS,
      CONF_FIELD_TYPE_SDS, 0,
      conf_set_password, conf_get_sds,
      offsetof(conf_server, requirepass) },
    { (char *)CONFIG_SOPN_ADMINPASS,
      CONF_FIELD_TYPE_SDS, 0,
      conf_set_password, conf_get_sds,
      offsetof(conf_server, adminpass) },
    { (char *)CONFIG_SOPN_COMMANDSNAP,
      CONF_FIELD_TYPE_ARRAYSDS, 1,
      conf_set_commands_need_adminpass, conf_get_array_sds,
      offsetof(conf_server, commands_need_adminpass) },
    { NULL, NULL, 0 }
};

/* Global configuration object. Its 'version' counter is incremented by the
 * conf_set_*() functions every time they store a new value. */
vr_conf *conf = NULL;
/* NOTE(review): presumably the "server" section of 'conf' - confirm where
 * it is assigned. */
conf_server *cserver = NULL;

/* Log a configuration value at 'log_level'.
 *
 * A string value is logged as is; an array value is logged by recursively
 * dumping each of its elements, which are themselves conf_value pointers.
 * A NULL 'cv' is ignored. Any other value type is a programming error. */
static void
conf_value_dump(conf_value *cv, int log_level)
{
    uint32_t i;
    conf_value **cv_sub;

    if(cv == NULL){
        return;
    }

    if(cv->type == CONF_VALUE_TYPE_STRING){
        /* The precision consumed by "%.*s" must be an int, while sdslen()
         * returns a size_t: convert explicitly. */
        log_debug(log_level, "%.*s", (int)sdslen(cv->value), cv->value);
    }else if(cv->type == CONF_VALUE_TYPE_ARRAY){
        for(i = 0; i < darray_n(cv->value); i++){
            cv_sub = darray_get(cv->value, i);
            conf_value_dump(*cv_sub, log_level);
        }
    }else{
        NOT_REACHED();
    }
}

/* Log one organization (section) of the configuration at 'log_level': a
 * "[name]" header followed by every key of the 'org' dictionary with its
 * value. String values are printed on the same line as the key, array
 * values are printed after the key through conf_value_dump(). Nothing is
 * logged if 'name' or 'org' is NULL. */
static void
conf_organization_dump(sds name, dict *org, int log_level)
{
    dictIterator *di;
    dictEntry *de;
    sds key;
    conf_value *cv;

    if(name == NULL || org == NULL){
        return;
    }

    /* The precision consumed by "%.*s" must be an int, while sdslen()
     * returns a size_t: convert explicitly here and below. */
    log_debug(log_level, "[%.*s]", (int)sdslen(name), name);

    di = dictGetIterator(org);

    while((de = dictNext(di)) != NULL){
        key = dictGetKey(de);
        cv = dictGetVal(de);

        if(cv->type == CONF_VALUE_TYPE_STRING){
            log_debug(log_level, "%.*s: %.*s",
                (int)sdslen(key), key,
                (int)sdslen(cv->value), cv->value);
        }else if(cv->type == CONF_VALUE_TYPE_ARRAY){
            log_debug(log_level, "%.*s:", (int)sdslen(key), key);
            conf_value_dump(cv, log_level);
        }else{
            NOT_REACHED();
        }
    }

    dictReleaseIterator(di);
}

/* Log every organization of the configuration 'cf' at verbose level, with
 * an empty log line after each one. A NULL 'cf' is ignored; a missing
 * organizations dictionary is reported and nothing else is logged. */
static void
conf_organizations_dump(vr_conf *cf)
{
    int log_level = LOG_VERB;
    dictIterator *iter;
    dictEntry *entry;

    if(cf == NULL){
        return;
    }

    if(cf->organizations == NULL){
        log_debug(log_level, "organization is NULL");
        return;
    }

    iter = dictGetIterator(cf->organizations);
    for(entry = dictNext(iter); entry != NULL; entry = dictNext(iter)){
        sds org_name = dictGetKey(entry);
        dict *org = dictGetVal(entry);

        conf_organization_dump(org_name, org, log_level);
        log_debug(log_level, "");
    }
    dictReleaseIterator(iter);
}

/* Setter for a memory size option stored as long long.
 *
 * 'obj' is the configuration object, 'opt' describes the option (name and
 * offset of the field inside 'obj') and 'data' is the conf_value to store.
 * The value must be a string that memtoll() parses without error into a
 * non negative number. On success the field is updated and conf->version
 * is incremented. Returns VR_OK or VR_ERROR; on error the field is left
 * untouched. */
int
conf_set_maxmemory(void *obj, conf_option *opt, void *data)
{
    conf_value *cv = data;
    long long *field;
    long long parsed;
    int parse_err;

    if(cv->type != CONF_VALUE_TYPE_STRING){
        log_error("conf pool %s in the conf file error", 
            opt->name);
        return VR_ERROR;
    }

    CONF_WLOCK();

    field = (long long *)((uint8_t *)obj + opt->offset);
    parsed = memtoll(cv->value, &parse_err);

    if(parse_err == 0 && parsed >= 0){
        *field = parsed;
        conf->version ++;
        CONF_UNLOCK();
        return VR_OK;
    }

    CONF_UNLOCK();
    log_error("value for the key %s in conf file is invalid", 
         opt->name);
    return VR_ERROR;
}

/* Setter for the maxmemory eviction policy.
 *
 * 'obj' is the configuration object, 'opt' describes the option (offset of
 * the int field inside 'obj') and 'data' is the conf_value to store. The
 * value must be a string equal to one of the names in evictpolicy_strings;
 * the index of the name in that table is what gets stored. The two LRU
 * policies are recognized but rejected as not supported.
 *
 * The value is fully validated before anything is written, so a rejected
 * value leaves the configuration as it was. On success conf->version is
 * incremented, like the other setters do. Returns VR_OK or VR_ERROR. */
int
conf_set_maxmemory_policy(void *obj, conf_option *opt, void *data)
{
    uint8_t *p;
    conf_value *cv = data;
    int *gt;
    int selected;
    char **policy;

    if(cv->type != CONF_VALUE_TYPE_STRING){
        log_error("conf server in the conf file is not a string");
        return VR_ERROR;
    }

    /* Look the name up; the loop stops on the NULL terminator if there is
     * no match. */
    for (policy = evictpolicy_strings; *policy; policy ++) {
        if (strcmp(cv->value, *policy) == 0) {
            break;
        }
    }

    if (*policy == NULL) {
        log_error("ERROR: Conf maxmemory policy '%s' is invalid", 
            cv->value);
        return VR_ERROR;
    }

    selected = (int)(policy - evictpolicy_strings);
    if (selected == MAXMEMORY_VOLATILE_LRU ||
        selected == MAXMEMORY_ALLKEYS_LRU) {
        log_error("ERROR: Conf maxmemory policy now is not support %s and %s", 
            evictpolicy_strings[MAXMEMORY_VOLATILE_LRU], 
            evictpolicy_strings[MAXMEMORY_ALLKEYS_LRU]);
        return VR_ERROR;
    }

    /* Only an accepted policy reaches the shared configuration. */
    CONF_WLOCK();
    p = obj;
    gt = (int*)(p + opt->offset);
    *gt = selected;
    conf->version ++;
    CONF_UNLOCK();
    return VR_OK;
}

/* Setter for an int option that must be 1 or greater.
 *
 * 'obj' is the configuration object, 'opt' describes the option (name and
 * offset of the int field inside 'obj') and 'data' is the conf_value to
 * store. The value must be a string accepted by sdsIsNum() that converts
 * to a number >= 1.
 *
 * The value is fully validated before anything is written, so a rejected
 * value leaves the configuration as it was. On success the field is
 * updated and conf->version is incremented. Returns VR_OK or VR_ERROR. */
int
conf_set_int_non_zero(void *obj, conf_option *opt, void *data)
{
    uint8_t *p;
    conf_value *cv = data;
    int *gt;
    int value;

    if(cv->type != CONF_VALUE_TYPE_STRING){
        log_error("conf pool %s in the conf file error", 
            opt->name);
        return VR_ERROR;
    }

    if(!sdsIsNum(cv->value)){
        log_error("value of the key %s in conf file is not a number", 
            opt->name);
        return VR_ERROR;
    }

    value = vr_atoi(cv->value, sdslen(cv->value));

    if (value < 0) {
        log_error("value of the key %s in conf file is invalid", 
            opt->name);
        return VR_ERROR;
    } else if (value < 1) {
        log_error("value of the key %s in conf file must be 1 or greater", 
            opt->name);
        return VR_ERROR;
    }

    /* Only an accepted value reaches the shared configuration. */
    CONF_WLOCK();
    p = obj;
    gt = (int*)(p + opt->offset);
    *gt = value;
    conf->version ++;
    CONF_UNLOCK();
    return VR_OK;
}

/* Getter for an sds option.
 *
 * 'data' must point to an sds that receives the result: NULL when the
 * option is not set, otherwise a copy of the stored string made with
 * sdsdup(). The copy belongs to the caller, who has to free it.
 * Returns VR_ERROR if 'data' is NULL, VR_OK otherwise. */
int
conf_get_sds(void *obj, conf_option *opt, void *data)
{
    sds *out = data;
    sds *field;

    if (out == NULL) {
        return VR_ERROR;
    }

    CONF_RLOCK();
    field = (sds *)((uint8_t *)obj + opt->offset);
    *out = (*field != NULL) ? sdsdup(*field) : NULL;
    CONF_UNLOCK();

    return VR_OK;
}

/* Setter for an sds option.
 *
 * 'obj' is the configuration object, 'opt' describes the option (name and
 * offset of the sds field inside 'obj') and 'data' is the conf_value to
 * store, which must be a string. The field receives a private copy of the
 * value and the string it previously held, if any, is released, as
 * conf_set_password() does. On success conf->version is incremented.
 * Returns VR_OK or VR_ERROR. */
int
conf_set_sds(void *obj, conf_option *opt, void *data)
{
    uint8_t *p;
    conf_value *cv = data;
    sds *gt;
    sds fresh;

    if(cv->type != CONF_VALUE_TYPE_STRING){
        log_error("conf pool %s in the conf file is not a string", 
            opt->name);
        return VR_ERROR;
    }

    CONF_WLOCK();
    p = obj;
    gt = (sds*)(p + opt->offset);

    /* Build the copy first, then drop the old value: overwriting the field
     * directly would leak the previous string. */
    fresh = sdsnewlen(cv->value, sdslen(cv->value));
    if (*gt != NULL) sdsfree(*gt);
    *gt = fresh;
    conf->version ++;
    CONF_UNLOCK();
    return VR_OK;
}

/* Setter for a password option stored as sds.
 *
 * The value must be a string no longer than CONFIG_AUTHPASS_MAX_LEN. The
 * previous password, if any, is freed. An empty value clears the password
 * (the field becomes NULL), any other value is stored as a private copy.
 * On success conf->version is incremented. Returns VR_OK or VR_ERROR. */
int
conf_set_password(void *obj, conf_option *opt, void *data)
{
    conf_value *cv = data;
    sds *field;

    if(cv->type != CONF_VALUE_TYPE_STRING){
        log_error("Conf pool %s in the conf file is not a string", 
            opt->name);
        return VR_ERROR;
    }
    if (sdslen(cv->value) > CONFIG_AUTHPASS_MAX_LEN) {
        log_error("Password is longer than CONFIG_AUTHPASS_MAX_LEN");
        return VR_ERROR;
    }

    CONF_WLOCK();
    field = (sds *)((uint8_t *)obj + opt->offset);

    if (*field != NULL) {
        sdsfree(*field);
    }
    *field = (sdslen(cv->value) == 0)
        ? NULL
        : sdsnewlen(cv->value, sdslen(cv->value));

    conf->version ++;
    CONF_UNLOCK();
    return VR_OK;
}

/* Getter for an int option: copies the field located at opt->offset inside
 * 'obj' into the int pointed to by 'data', under the configuration read
 * lock. Returns VR_ERROR if 'data' is NULL, VR_OK otherwise. */
int
conf_get_int(void *obj, conf_option *opt, void *data)
{
    int *out = data;
    int *field;

    if (out == NULL) {
        return VR_ERROR;
    }

    CONF_RLOCK();
    field = (int *)((uint8_t *)obj + opt->offset);
    *out = *field;
    CONF_UNLOCK();

    return VR_OK;
}

/* Setter for a non negative int option.
 *
 * 'obj' is the configuration object, 'opt' describes the option (name and
 * offset of the int field inside 'obj') and 'data' is the conf_value to
 * store. The value must be a string accepted by sdsIsNum() that converts
 * to a number >= 0.
 *
 * The value is fully validated before anything is written, so a rejected
 * value leaves the configuration as it was. On success the field is
 * updated and conf->version is incremented. Returns VR_OK or VR_ERROR. */
int
conf_set_int(void *obj, conf_option *opt, void *data)
{
    uint8_t *p;
    conf_value *cv = data;
    int *gt;
    int value;

    if(cv->type != CONF_VALUE_TYPE_STRING){
        log_error("conf pool %s in the conf file error", 
            opt->name);
        return VR_ERROR;
    }

    if(!sdsIsNum(cv->value)){
        log_error("value of the key %s in conf file is not a number", 
            opt->name);
        return VR_ERROR;
    }

    value = vr_atoi(cv->value, sdslen(cv->value));

    if (value < 0) {
        log_error("value of the key %s in conf file is invalid", 
            opt->name);
        return VR_ERROR;
    }

    /* Only an accepted value reaches the shared configuration. */
    CONF_WLOCK();
    p = obj;
    gt = (int*)(p + opt->offset);
    *gt = value;
    conf->version ++;
    CONF_UNLOCK();
    return VR_OK;
}

/*
 * Getter for long long options: copies the long long stored at
 * obj + opt->offset into the long long pointed to by data, under the
 * configuration read lock.
 *
 * Returns VR_ERROR when data is NULL, VR_OK otherwise.
 */
int
conf_get_longlong(void *obj, conf_option *opt, void *data)
{
    long long *out = data;
    long long *field;

    if (out == NULL) {
        return VR_ERROR;
    }

    CONF_RLOCK();
    field = (long long *)((uint8_t *)obj + opt->offset);
    *out = *field;
    CONF_UNLOCK();

    return VR_OK;
}

/*
 * Setter for long long options.
 *
 * data must be a conf_value of type CONF_VALUE_TYPE_STRING; its text is
 * converted with string2ll() directly into the field at obj + opt->offset
 * while the configuration write lock is held.
 *
 * Returns VR_OK on success, VR_ERROR if the value is not a string or
 * string2ll() rejects it.
 */
int
conf_set_longlong(void *obj, conf_option *opt, void *data)
{
    conf_value *cv = data;
    long long *target;
    int converted;

    if (cv->type != CONF_VALUE_TYPE_STRING) {
        log_error("conf pool %s in the conf file error", 
            opt->name);
        return VR_ERROR;
    }

    CONF_WLOCK();
    target = (long long *)((uint8_t *)obj + opt->offset);
    converted = string2ll(cv->value, sdslen(cv->value), target) ? 1 : 0;
    if (converted) {
        conf->version ++;
    }
    CONF_UNLOCK();

    if (!converted) {
        log_error("value of the key %s in conf file is invalid", 
            opt->name);
        return VR_ERROR;
    }

    return VR_OK;
}

/*
 * Setter for boolean options expressed as CONF_VALUE_YES / CONF_VALUE_NO
 * (compared case-insensitively). Stores 1 or 0 in the int field at
 * obj + opt->offset.
 *
 * Returns VR_OK on success, VR_ERROR if the value is not a string or is
 * neither of the two accepted words.
 */
int
conf_set_yesorno(void *obj, conf_option *opt, void *data)
{
    conf_value *cv = data;
    int *flag;
    int parsed;

    if (cv->type != CONF_VALUE_TYPE_STRING) {
        log_error("conf pool %s in the conf file error", 
            opt->name);
        return VR_ERROR;
    }

    CONF_WLOCK();

    flag = (int *)((uint8_t *)obj + opt->offset);

    if (strcasecmp(cv->value, CONF_VALUE_YES) == 0) {
        parsed = 1;
    } else if (strcasecmp(cv->value, CONF_VALUE_NO) == 0) {
        parsed = 0;
    } else {
        parsed = -1;
    }

    if (parsed < 0) {
        CONF_UNLOCK();
        log_error("key %s in conf file must be %s or %s",
            opt->name, CONF_VALUE_YES, CONF_VALUE_NO);
        return VR_ERROR;
    }

    *flag = parsed;
    conf->version ++;
    CONF_UNLOCK();

    return VR_OK;
}

/*
 * Setter for options stored as a darray of sds strings.
 *
 * obj  - base address of the structure holding the option.
 * opt  - option descriptor; opt->offset locates the struct darray in obj.
 * data - conf_value that is either a single string or an array whose
 *        elements are all strings.
 *
 * The current content of the target array is freed and replaced with
 * duplicates of the supplied string(s).
 *
 * Returns VR_OK on success, VR_ERROR when the value has the wrong type.
 */
int
conf_set_array_sds(void *obj, conf_option *opt, void *data)
{
    uint8_t *p;
    uint32_t j;
    conf_value **cv_sub, *cv = data;
    struct darray *gt;
    sds *str;

    if(cv->type != CONF_VALUE_TYPE_STRING && 
        cv->type != CONF_VALUE_TYPE_ARRAY){
        log_error("conf pool %s in the conf file is not a string or array", 
            opt->name);
        return VR_ERROR;
    }

    /* Validate every element before modifying the stored configuration. */
    if (cv->type == CONF_VALUE_TYPE_ARRAY) {
        for (j = 0; j < darray_n(cv->value); j ++) {
            cv_sub = darray_get(cv->value, j);
            if ((*cv_sub)->type != CONF_VALUE_TYPE_STRING) {
                log_error("conf pool %s in the conf file is not a string array", 
                    opt->name);
                return VR_ERROR;
            }
        }
    }

    CONF_WLOCK();
    p = obj;
    gt = (struct darray*)(p + opt->offset);

    /* Release the strings currently stored in the option. */
    while (darray_n(gt) > 0) {
        str = darray_pop(gt);
        sdsfree(*str);
    }

    if (cv->type == CONF_VALUE_TYPE_STRING) {
        str = darray_push(gt);
        *str = sdsdup(cv->value);
    } else if (cv->type == CONF_VALUE_TYPE_ARRAY) {
        for (j = 0; j < darray_n(cv->value); j ++) {
            cv_sub = darray_get(cv->value, j);
            str = darray_push(gt);
            *str = sdsdup((*cv_sub)->value);
        }
    }
    conf->version ++;
    CONF_UNLOCK();
    return VR_OK;
}

/*
 * Setter for the list of commands that require the admin password.
 *
 * obj  - base address of the structure holding the option.
 * opt  - option descriptor; opt->offset locates the struct darray in obj.
 * data - conf_value that is either a single string or an array whose
 *        elements are all strings.
 *
 * The current content of the target array is freed and replaced with
 * duplicates of the supplied string(s).
 *
 * Returns VR_OK on success, VR_ERROR when the value has the wrong type.
 */
int
conf_set_commands_need_adminpass(void *obj, conf_option *opt, void *data)
{
    uint8_t *p;
    uint32_t j;
    conf_value **cv_sub, *cv = data;
    struct darray *gt;
    sds *str;

    if(cv->type != CONF_VALUE_TYPE_STRING && 
        cv->type != CONF_VALUE_TYPE_ARRAY){
        log_error("conf pool %s in the conf file is not a string or array", 
            opt->name);
        return VR_ERROR;
    }

    /* Validate every element before modifying the stored configuration. */
    if (cv->type == CONF_VALUE_TYPE_ARRAY) {
        for (j = 0; j < darray_n(cv->value); j ++) {
            cv_sub = darray_get(cv->value, j);
            if ((*cv_sub)->type != CONF_VALUE_TYPE_STRING) {
                log_error("conf pool %s in the conf file is not a string array", 
                    opt->name);
                return VR_ERROR;
            }
        }
    }

    CONF_WLOCK();
    p = obj;
    gt = (struct darray*)(p + opt->offset);

    /* Release the command names currently stored in the option. */
    while (darray_n(gt) > 0) {
        str = darray_pop(gt);
        sdsfree(*str);
    }

    if (cv->type == CONF_VALUE_TYPE_STRING) {
        str = darray_push(gt);
        *str = sdsdup(cv->value);
    } else if (cv->type == CONF_VALUE_TYPE_ARRAY) {
        for (j = 0; j < darray_n(cv->value); j ++) {
            cv_sub = darray_get(cv->value, j);
            str = darray_push(gt);
            *str = sdsdup((*cv_sub)->value);
        }
    }
    conf->version ++;
    CONF_UNLOCK();
    return VR_OK;
}

/*
 * Getter for options stored as a darray of sds strings.
 *
 * obj  - base address of the structure holding the option.
 * opt  - option descriptor; opt->offset locates the struct darray in obj.
 * data - an initialized, empty struct darray of sds supplied by the caller;
 *        a duplicate of every stored string is pushed onto it, in order.
 *        The caller owns (and must free) the duplicated strings.
 *
 * Returns VR_ERROR when data is NULL, VR_OK otherwise.
 */
int
conf_get_array_sds(void *obj, conf_option *opt, void *data)
{
    uint8_t *p;
    uint32_t j;
    struct darray *strs = data;
    struct darray *gt;
    sds *str1, *str2;

    if (data == NULL) {
        return VR_ERROR;
    }

    CONF_RLOCK();
    p = obj;
    gt = (struct darray*)(p + opt->offset);

    ASSERT(darray_n(strs) == 0);

    for (j = 0; j < darray_n(gt); j ++) {
        str1 = darray_get(gt, j);
        str2 = darray_push(strs);
        *str2 = sdsdup(*str1);
    }
    
    CONF_UNLOCK();
    return VR_OK;
}

static void dictConfValueDestructor(void *privdata, void *val)
{
    DICT_NOTUSED(privdata);

    conf_value_destroy(val);
}

static void dictDestructor(void *privdata, void *val)
{
    DICT_NOTUSED(privdata);

    dictRelease(val);
}

/* Dict type used for vr_conf.organizations: sds keys, and values released
 * with dictDestructor (i.e. each value is itself a dict). */
static dictType OrganizationDictType = {
    dictSdsHash,                /* hash function */
    NULL,                       /* key dup */
    NULL,                       /* val dup */
    dictSdsKeyCompare,          /* key compare */
    dictSdsDestructor,          /* key destructor */
    dictDestructor              /* val destructor */
};

/* Dict type used for one organization's key -> value map: sds keys, and
 * conf_value values released with conf_value_destroy(). */
static dictType KeyValueDictType = {
    dictSdsHash,                /* hash function */
    NULL,                       /* key dup */
    NULL,                       /* val dup */
    dictSdsKeyCompare,          /* key compare */
    dictSdsDestructor,          /* key destructor */
    dictConfValueDestructor     /* val destructor */
};

/* Dict type used for conf_server.ctable (option name -> conf_option).
 * Keys are hashed/compared case-insensitively; neither keys nor values are
 * freed by the dict (no destructors are registered). */
static dictType ConfTableDictType = {
    dictStrCaseHash,            /* hash function */
    NULL,                       /* key dup */
    NULL,                       /* val dup */
    dictStrKeyCaseCompare,      /* key compare */
    NULL,                       /* key destructor */
    NULL                        /* val destructor */
};

/*
 * Allocate a conf_value of the given type.
 *
 * For CONF_VALUE_TYPE_ARRAY the value is a freshly created darray of
 * conf_value pointers; for every other type the value starts out NULL.
 *
 * Returns the new object, or NULL if an allocation fails.
 */
conf_value *conf_value_create(int type)
{
    conf_value *cv = dalloc(sizeof(*cv));

    if (cv == NULL) {
        return NULL;
    }

    cv->type = type;
    cv->value = NULL;

    if (type != CONF_VALUE_TYPE_ARRAY) {
        return cv;
    }

    cv->value = darray_create(3, sizeof(conf_value*));
    if (cv->value != NULL) {
        return cv;
    }

    /* Could not allocate the element array: undo the allocation. */
    dfree(cv);
    return NULL;
}

/*
 * Free a conf_value and everything it owns.
 *
 * String values free their sds; array values recursively destroy every
 * element and then the array itself. NULL is accepted and ignored.
 */
void conf_value_destroy(conf_value *cv)
{
    if (cv == NULL) {
        return;
    }

    if (cv->type == CONF_VALUE_TYPE_STRING) {
        if (cv->value != NULL) {
            sdsfree(cv->value);
        }
    } else if (cv->type == CONF_VALUE_TYPE_ARRAY) {
        if (cv->value != NULL) {
            while (darray_n(cv->value) > 0) {
                conf_value **child = darray_pop(cv->value);
                conf_value_destroy(*child);
            }

            darray_destroy(cv->value);
        }
    } else if (cv->type != CONF_VALUE_TYPE_UNKNOW) {
        /* Any type other than the three known ones is a programming error. */
        NOT_REACHED();
    }

    dfree(cv);
}

/*
 * Put a conf_server into its "unset" state: create the option lookup
 * table, mark numeric fields CONF_UNSET_NUM and pointer fields
 * CONF_UNSET_PTR, and initialize the two sds arrays.
 *
 * Returns VR_ERROR if cs is NULL, VR_OK otherwise.
 */
static int conf_server_init(conf_server *cs)
{
    if (cs == NULL) {
        return VR_ERROR;
    }

    cs->ctable = dictCreate(&ConfTableDictType,NULL);

    /* Numeric options. */
    cs->databases = CONF_UNSET_NUM;
    cs->internal_dbs_per_databases = CONF_UNSET_NUM;
    cs->max_time_complexity_limit = CONF_UNSET_NUM;
    cs->maxmemory = CONF_UNSET_NUM;
    cs->maxmemory_policy = CONF_UNSET_NUM;
    cs->maxmemory_samples = CONF_UNSET_NUM;
    cs->maxclients = CONF_UNSET_NUM;
    cs->threads = CONF_UNSET_NUM;
    cs->port = CONF_UNSET_NUM;

    /* String options. */
    cs->requirepass = CONF_UNSET_PTR;
    cs->adminpass = CONF_UNSET_PTR;
    cs->dir = CONF_UNSET_PTR;

    /* Array-of-sds options. */
    darray_init(&cs->binds,1,sizeof(sds));
    darray_init(&cs->commands_need_adminpass,1,sizeof(sds));

    return VR_OK;
}

/*
 * Register every entry of conf_server_options in cs->ctable and load the
 * compiled-in default value of each server option.
 *
 * Returns VR_ERROR if cs is NULL, VR_OK otherwise.
 */
static int conf_server_set_default(conf_server *cs)
{
    conf_option *option;
    sds *slot;

    if (cs == NULL) {
        return VR_ERROR;
    }

    /* The table is terminated by an entry whose name is NULL. */
    for (option = conf_server_options; option&&option->name; option++) {
        dictAdd(cs->ctable,option->name,option);
    }

    cs->databases = CONFIG_DEFAULT_LOGICAL_DBNUM;
    cs->internal_dbs_per_databases = CONFIG_DEFAULT_INTERNAL_DBNUM;
    cs->max_time_complexity_limit = CONFIG_DEFAULT_MAX_TIME_COMPLEXITY_LIMIT;
    cs->maxmemory = CONFIG_DEFAULT_MAXMEMORY;
    cs->maxmemory_policy = CONFIG_DEFAULT_MAXMEMORY_POLICY;
    cs->maxmemory_samples = CONFIG_DEFAULT_MAXMEMORY_SAMPLES;
    cs->maxclients = CONFIG_DEFAULT_MAX_CLIENTS;
    cs->threads = CONFIG_DEFAULT_THREADS_NUM;
    cs->slowlog_log_slower_than = CONFIG_DEFAULT_SLOWLOG_LOG_SLOWER_THAN;
    cs->slowlog_max_len = CONFIG_DEFAULT_SLOWLOG_MAX_LEN;
    cs->requirepass = CONF_UNSET_PTR;
    cs->adminpass = CONF_UNSET_PTR;

    /* binds: drop whatever is stored, then install the default host. */
    while (darray_n(&cs->binds) > 0) {
        slot = darray_pop(&cs->binds);
        sdsfree(*slot);
    }
    slot = darray_push(&cs->binds);
    *slot = sdsnew(CONFIG_DEFAULT_HOST);

    cs->port = CONFIG_DEFAULT_SERVER_PORT;

    /* dir: replace any previous value with the default data directory. */
    if (cs->dir != CONF_UNSET_PTR) {
        sdsfree(cs->dir);
    }
    cs->dir = sdsnew(CONFIG_DEFAULT_DATA_DIR);

    /* commands_need_adminpass: the default is an empty list. */
    while (darray_n(&cs->commands_need_adminpass) > 0) {
        slot = darray_pop(&cs->commands_need_adminpass);
        sdsfree(*slot);
    }

    return VR_OK;
}

/*
 * Release everything owned by a conf_server and return its fields to the
 * "unset" state. NULL is accepted and ignored.
 *
 * This also releases the option lookup table (cs->ctable) created by
 * conf_server_init(); its dict type registers no key/value destructors, so
 * only the table itself is freed.
 */
static void conf_server_deinit(conf_server *cs)
{
    sds *str;
    
    if(cs == NULL){
        return;
    }

    if (cs->ctable != NULL) {
        dictRelease(cs->ctable);
        cs->ctable = NULL;
    }

    cs->databases = CONF_UNSET_NUM;
    cs->internal_dbs_per_databases = CONF_UNSET_NUM;
    cs->maxmemory = CONF_UNSET_NUM;
    cs->maxmemory_policy = CONF_UNSET_NUM;
    cs->maxmemory_samples = CONF_UNSET_NUM;
    cs->max_time_complexity_limit = CONF_UNSET_NUM;
    cs->maxclients = CONF_UNSET_NUM;
    cs->threads = CONF_UNSET_NUM;

    while (darray_n(&cs->binds) > 0) {
        str = darray_pop(&cs->binds);
        sdsfree(*str);
    }
    darray_deinit(&cs->binds);

    cs->port = CONF_UNSET_NUM;
    
    if (cs->dir != CONF_UNSET_PTR) {
        sdsfree(cs->dir);
        cs->dir = CONF_UNSET_PTR;    
    }

    if (cs->requirepass != CONF_UNSET_PTR) {
        sdsfree(cs->requirepass);
        cs->requirepass = CONF_UNSET_PTR;    
    }
    if (cs->adminpass != CONF_UNSET_PTR) {
        sdsfree(cs->adminpass);
        cs->adminpass = CONF_UNSET_PTR;    
    }

    while (darray_n(&cs->commands_need_adminpass) > 0) {
        str = darray_pop(&cs->commands_need_adminpass);
        sdsfree(*str);
    }
    darray_deinit(&cs->commands_need_adminpass);
}

/*
 * Read a server option by name through its registered getter.
 *
 * option_name - key looked up in cserver->ctable.
 * value       - output location, interpreted by the option's getter.
 *
 * Returns VR_ERROR if the option is unknown, otherwise the getter's result.
 */
int
conf_server_get(const char *option_name, void *value)
{
    conf_option *option = dictFetchValue(cserver->ctable, option_name);

    if (option != NULL) {
        return option->get(cserver, option, value);
    }

    return VR_ERROR;
}

/*
 * Write a server option by name through its registered setter.
 *
 * Returns VR_ERROR if the option is unknown or is flagged
 * CONF_FIELD_FLAGS_NO_MODIFY, otherwise the setter's result.
 */
int
conf_server_set(const char *option_name, conf_value *value)
{
    conf_option *option = dictFetchValue(cserver->ctable, option_name);

    if (option == NULL) {
        return VR_ERROR;
    }

    if (option->flags & CONF_FIELD_FLAGS_NO_MODIFY) {
        return VR_ERROR;
    }

    return option->set(cserver, option, value);
}

/*
 * Initialize a freshly allocated vr_conf: reset its fields, create its
 * locks, initialize the embedded server section and create the (empty)
 * organizations dict. On success the global `conf` pointer is set to cf.
 *
 * The server section is initialized before the organizations dict is
 * created so that, if the dict allocation fails, the caller's cleanup
 * (conf_destroy -> conf_deinit) walks initialized state only.
 *
 * Returns VR_OK on success, VR_ERROR if cf is NULL or an initialization
 * step fails.
 */
static int conf_init(vr_conf *cf)
{
    if(cf == NULL){
        return VR_ERROR;
    }

    cf->fname = NULL;
    cf->organizations = NULL;
    cf->version = 0;
    pthread_rwlock_init(&cf->rwl, NULL);
    pthread_mutex_init(&cf->flock, NULL);

    if (conf_server_init(&cf->cserver) != VR_OK) {
        return VR_ERROR;
    }

    cf->organizations = dictCreate(&OrganizationDictType, NULL);
    if (cf->organizations == NULL) {
        return VR_ERROR;
    }

    conf = cf;
    
    return VR_OK;
}

/*
 * Load the default value of every option into cf while holding the
 * configuration write lock. Always returns VR_OK.
 */
static int
conf_set_default(vr_conf *cf)
{
    conf_server *server = &cf->cserver;

    CONF_WLOCK();
    conf_server_set_default(server);
    CONF_UNLOCK();

    return VR_OK;
}

/*
 * Release everything owned by cf (file name, organizations dict, server
 * section) and destroy its locks. The vr_conf structure itself is not
 * freed. NULL is accepted and ignored.
 */
static void
conf_deinit(vr_conf *cf)
{
    if (cf == NULL) {
        return;
    }

    if (cf->fname != NULL) {
        sdsfree(cf->fname);
    }
    cf->fname = NULL;

    if (cf->organizations != NULL) {
        dictRelease(cf->organizations);
    }
    cf->organizations = NULL;

    conf_server_deinit(&cf->cserver);

    cf->version = 0;
    pthread_rwlock_destroy(&cf->rwl);
    pthread_mutex_destroy(&cf->flock);
}

/*
 * Log a subset of the server options (database counts, memory limits and
 * the time complexity limit) at the given log level. Does nothing when cs
 * is NULL.
 */
static void
conf_server_dump(conf_server *cs, int log_level)
{
    if (cs != NULL) {
        log_debug(log_level, "  databases : %d", cs->databases);
        log_debug(log_level, "  internal_dbs_per_databases : %d", cs->internal_dbs_per_databases);
        log_debug(log_level, "  maxmemory : %lld", cs->maxmemory);
        log_debug(log_level, "  maxmemory_policy : %d", cs->maxmemory_policy);    
        log_debug(log_level, "  maxmemory_samples : %d", cs->maxmemory_samples);
        log_debug(log_level, "  max_time_complexity_limit : %lld", cs->max_time_complexity_limit);
    }
}

/*
 * Log the parsed configuration at LOG_VERB level: a heading, the server
 * section, and a trailing empty line. Does nothing when cf is NULL.
 */
static void
conf_dump(vr_conf *cf)
{
    int level = LOG_VERB;

    if (cf == NULL) {
        return;
    }

    log_debug(level, "server in conf file");
    conf_server_dump(&cf->cserver, level);
    log_debug(level, "");
}

/*
 * Add the pair (key, cv) to the organization dict `org`.
 *
 * If the key is not present yet, it is inserted together with cv.
 * If the key already exists, cv is appended to the existing value: an
 * existing array value simply grows by one element, while an existing
 * non-array value is first wrapped, together with cv, in a new array value
 * that replaces it in the dict.
 *
 * Returns:
 *   -1  a required argument (key, cv or org) is NULL;
 *    0  the key already existed and cv was appended to its value;
 *    1  the key was newly inserted.
 */
static int
conf_key_value_insert(dict *org, sds key, conf_value *cv)
{
    dictEntry *entry;
    conf_value *existing, *wrapper, **slot;

    if (key == NULL) {
        log_error("value in conf file has no key");
        return -1;
    }

    if (cv == NULL) {
        log_error("key %s in conf file has no value", key);
        return -1;
    }

    if (org == NULL) {
        log_error("key %s in conf file has no organization", 
            key);
        return -1;
    }

    /* Fast path: the key was not known yet. */
    if (dictAdd(org,key,cv) == DICT_OK) {
        return 1;
    }

    entry = dictFind(org,key);
    existing = dictGetVal(entry);

    if (existing->type == CONF_VALUE_TYPE_ARRAY) {
        slot = darray_push(existing->value);
        *slot = cv;
        return 0;
    }

    /* Promote the single value to an array holding the old and new one. */
    wrapper = conf_value_create(CONF_VALUE_TYPE_ARRAY);
    slot = darray_push(wrapper->value);
    *slot = existing;
    slot = darray_push(wrapper->value);
    *slot = cv;
    dictSetVal(org,entry,wrapper);

    return 0;
}

/*
 * Split the configuration text into lines and load every "key value..."
 * directive into cf->organizations.
 *
 * - Blank lines and lines starting with '#' are skipped.
 * - A line of the form "[name]" selects (creating it if needed) the
 *   organization that following directives belong to.
 * - Directives that appear before any "[name]" line go into an
 *   organization called "server".
 * - The first token of a directive is lower-cased and used as the key;
 *   every following token is inserted as a string value for that key.
 *
 * Returns VR_OK on success, VR_ERROR on a malformed line or an allocation
 * failure.
 */
static int
conf_pre_load_from_string(vr_conf *cf, char *config)
{
    int ret;
    int totlines = 0, i, j;
    sds *lines = NULL;
    dict *org = NULL;
    sds org_name = NULL;
    dictEntry *de;
    sds key = NULL;
    conf_value *cv = NULL;

    lines = sdssplitlen(config,strlen(config),"\n",1,&totlines);

    for (i = 0; i < totlines; i++) {
        sds *argv;
        int argc;
        int key_in_dict;

        lines[i] = sdstrim(lines[i]," \t\r\n");

        /* Skip comments and blank lines */
        if (lines[i][0] == '#' || lines[i][0] == '\0') continue;

        if (lines[i][0] == '[') {
            size_t len = sdslen(lines[i]);

            /* A valid header is "[", at least one character, then "]". */
            if (len <= 2 || lines[i][len-1] != ']') {
                log_error("Organization name %s in conf file %s error",
                    lines[i], cf->fname);
                goto loaderr;
            }
            org_name = sdsnewlen(lines[i]+1,len-2);
            de = dictFind(cf->organizations,org_name);
            if (de == NULL) {
                org = dictCreate(&KeyValueDictType, NULL);
                dictAdd(cf->organizations,org_name,org);
            } else {
                org = dictGetVal(de);
                sdsfree(org_name);
            }
            
            continue;
        }

        /* Split into arguments */
        argv = sdssplitargs(lines[i],&argc);
        if (argv == NULL) {
            log_error("Unbalanced quotes in configuration line");
            goto loaderr;
        }

        /* Skip this line if the resulting command vector is empty. */
        if (argc == 0) {
            sdsfreesplitres(argv,argc);
            continue;
        }
        sdstolower(argv[0]);

        if (org == NULL) {
            org_name = sdsnew("server");
            org = dictCreate(&KeyValueDictType, NULL);
            dictAdd(cf->organizations,org_name,org);
        }

        /* Detach the key from argv; it is either handed over to the dict
         * (first insertion of this key) or freed below once every value of
         * this line has been processed. */
        key = argv[0];
        argv[0] = NULL;
        key_in_dict = 0;
        for (j = 1; j < argc; j ++) {
            cv = conf_value_create(CONF_VALUE_TYPE_STRING);
            if (cv == NULL) {
                log_error("key value insert into organization failed");
                if (!key_in_dict) sdsfree(key);
                sdsfreesplitres(argv,argc);
                goto loaderr;
            }
            cv->value = argv[j];
            argv[j] = NULL;
            ret = conf_key_value_insert(org, key, cv);
            if(ret == -1){
                sdsfreesplitres(argv,argc);
                if (!key_in_dict) sdsfree(key);
                conf_value_destroy(cv);
                log_error("key value insert into organization failed");
                goto loaderr;
            } else if (ret == 1) {
                /* The dict took ownership of this key string. */
                key_in_dict = 1;
            }
        }

        /* The key already existed in the dict (or the directive had no
         * values): our copy was only used for lookups. */
        if (!key_in_dict) sdsfree(key);
        key = NULL;

        sdsfreesplitres(argv,argc);
    }

    if (lines) {
        sdsfreesplitres(lines,totlines);
    }
    return VR_OK;
    
loaderr:
    /* Free every line, including the ones not reached before the error. */
    if (lines) {
        sdsfreesplitres(lines,totlines);
    }
    return VR_ERROR;
}

/*
 * Read the whole configuration file named by cf->fname (or stdin when the
 * name is "-") into memory and load it into cf->organizations.
 *
 * Returns VR_OK on success, VR_ERROR if the file cannot be opened or its
 * content cannot be loaded.
 */
static int
conf_pre_validate(vr_conf *cf)
{
    int ret;
    sds content = sdsempty();
    char chunk[CONF_MAX_LINE+1];

    /* Load the file content */
    if (cf->fname) {
        FILE *in;
        int from_stdin = (cf->fname[0] == '-' && cf->fname[1] == '\0');

        if (from_stdin) {
            in = stdin;
        } else {
            in = fopen(cf->fname,"r");
            if (in == NULL) {
                log_error("Open config file '%s' failed: %s", cf->fname, strerror(errno));
                sdsfree(content);
                return VR_ERROR;
            }
        }

        while (fgets(chunk,CONF_MAX_LINE+1,in) != NULL) {
            content = sdscat(content,chunk);
        }

        if (in != stdin) {
            fclose(in);
        }
    }

    ret = conf_pre_load_from_string(cf,content);
    sdsfree(content);

    return (ret == VR_OK) ? VR_OK : VR_ERROR;
}

/*
 * Apply the values found in the organization dict `org` to the server
 * section `cs`: for every entry of conf_server_options whose name is a key
 * of `org`, the option's setter is invoked with the stored value.
 *
 * Returns VR_OK on success, VR_ERROR if an argument is NULL or a setter
 * rejects its value (processing stops at the first failure).
 */
static int
conf_parse_conf_server(conf_server *cs, dict *org)
{
    int status = VR_OK;
    conf_option *option;
    dictEntry *entry;
    sds name;

    if (cs == NULL || org == NULL) {
        return VR_ERROR;
    }

    /* One reusable sds buffer holds the option name used for lookups. */
    name = sdsempty();
    for (option = conf_server_options; option&&option->name; option++) {
        name = sdscpy(name,option->name);
        entry = dictFind(org,name);
        if (entry == NULL) {
            continue;
        }

        if (option->set(cs, option, dictGetVal(entry)) != VR_OK) {
            log_error("parse key %s in conf file error", name);
            status = VR_ERROR;
            break;
        }
    }

    sdsfree(name);
    return status;
}

/*
 * Turn the raw key/value data in cf->organizations into typed settings.
 * Only the CONF_ORGANIZATION_NAME_SERVER organization is processed, and it
 * must be present.
 *
 * Returns VR_OK on success, VR_ERROR otherwise.
 */
static int
conf_parse(vr_conf *cf)
{
    int status = VR_ERROR;
    dict *all, *server_org;
    dictEntry *entry;
    sds name;

    if (cf == NULL) {
        return VR_ERROR;
    }

    all = cf->organizations;
    if (all == NULL) {
        return VR_ERROR;
    }

    /* server */
    name = sdsnew(CONF_ORGANIZATION_NAME_SERVER);

    entry = dictFind(all, name);
    if (entry == NULL) {
        log_error("can not find %s organization in conf file %s", 
            CONF_ORGANIZATION_NAME_SERVER, cf->fname);
        goto done;
    }

    server_org = dictGetVal(entry);
    if (server_org == NULL) {
        log_error("dict %s entry value is NULL", dictGetKey(entry));
        goto done;
    }

    if (conf_parse_conf_server(&cf->cserver, server_org) != VR_OK) {
        log_error("common conf parse error");
        goto done;
    }

    status = VR_OK;

done:
    sdsfree(name);
    return status;
}

/*
 * Final step of configuration loading: the raw organizations dict is no
 * longer needed once parsing is done, so release it.
 *
 * Returns VR_ERROR if cf is NULL, VR_OK otherwise.
 */
static int
conf_post_validate(vr_conf *cf)
{
    dict *raw;

    if (cf == NULL) {
        return VR_ERROR;
    }

    raw = cf->organizations;
    if (raw != NULL) {
        dictRelease(raw);
        cf->organizations = NULL;
    }

    return VR_OK;
}

/*
 * Allocate a vr_conf for the given configuration file: resolve the file
 * name to an absolute path, initialize the structure and load the default
 * values. The file itself is not read here.
 *
 * Returns the new vr_conf (which owns the resolved path in cf->fname), or
 * NULL on failure.
 */
static vr_conf *
conf_open(char *filename)
{
    vr_conf *cf;
    sds path;

    if (filename == NULL) {
        log_error("configuration file name is NULL.");
        return NULL;
    }

    path = getAbsolutePath(filename);
    if (path == NULL) {
        log_error("configuration file name '%s' is error.", filename);
        return NULL;
    }

    cf = dalloc(sizeof(*cf));
    if (cf == NULL) {
        sdsfree(path);
        return NULL;
    }

    if (conf_init(cf) != VR_OK || conf_set_default(cf) != VR_OK) {
        /* cf->fname is not set yet, so the path is released separately. */
        conf_destroy(cf);
        sdsfree(path);
        return NULL;
    }

    cf->fname = path;

    return cf;
}

/*
 * Build the configuration from a file: open it, load its raw content,
 * parse it into typed settings and run the post-validation step. On
 * success the global `cserver` pointer is set to the new server section.
 *
 * Returns the new vr_conf, or NULL on failure (everything allocated on the
 * way is destroyed).
 */
vr_conf *
conf_create(char *filename)
{
    vr_conf *cf = conf_open(filename);

    if (cf == NULL) {
        return NULL;
    }

    /* validate configuration file before parsing */
    if (conf_pre_validate(cf) != VR_OK) {
        conf_destroy(cf);
        return NULL;
    }

    conf_organizations_dump(cf);

    /* parse the configuration file */
    if (conf_parse(cf) != VR_OK) {
        conf_destroy(cf);
        return NULL;
    }

    /* validate parsed configuration */
    if (conf_post_validate(cf) != VR_OK) {
        conf_destroy(cf);
        return NULL;
    }

    conf_dump(cf);

    cserver = &cf->cserver;

    return cf;
}

/* Deinitialize cf and free the structure itself. NULL is ignored. */
void 
conf_destroy(vr_conf *cf)
{
    if (cf != NULL) {
        conf_deinit(cf);
        dfree(cf);
    }
}

/*
 * Return the current configuration version counter, read under the
 * configuration read lock. The setters in this file increment it on every
 * successful change.
 */
unsigned long long
conf_version_get(void)
{
    unsigned long long current;

    CONF_RLOCK();
    current = conf->version;
    CONF_UNLOCK();

    return current;
}

/* Take the global configuration rwlock for reading.
 * Returns the result of pthread_rwlock_rdlock(). */
int
CONF_RLOCK(void)
{
    int rc = pthread_rwlock_rdlock(&conf->rwl);

    return rc;
}

/* Take the global configuration rwlock for writing.
 * Returns the result of pthread_rwlock_wrlock(). */
int
CONF_WLOCK(void)
{
    int rc = pthread_rwlock_wrlock(&conf->rwl);

    return rc;
}

/* Release the global configuration rwlock (read or write side).
 * Returns the result of pthread_rwlock_unlock(). */
int
CONF_UNLOCK(void)
{
    int rc = pthread_rwlock_unlock(&conf->rwl);

    return rc;
}

/* Lock the `flock` mutex of the global configuration.
 * Returns the result of pthread_mutex_lock(). */
int
CONFF_LOCK(void)
{
    int rc = pthread_mutex_lock(&conf->flock);

    return rc;
}

/* Unlock the `flock` mutex of the global configuration.
 * Returns the result of pthread_mutex_unlock(). */
int
CONFF_UNLOCK(void)
{
    int rc = pthread_mutex_unlock(&conf->flock);

    return rc;
}

/*
 * Return the entry of evictpolicy_strings at index evictpolicy_type.
 * The index is not range-checked here; the caller must pass a valid one.
 */
const char *
get_evictpolicy_strings(int evictpolicy_type)
{
    const char *policy_name = evictpolicy_strings[evictpolicy_type];

    return policy_name;
}

/*-----------------------------------------------------------------------------
 * CONFIG SET implementation
 *----------------------------------------------------------------------------*/

/*
 * CONFIG SET <parameter> <value>
 *
 * c->argv[2] is the option name and c->argv[3] the new value. The option is
 * looked up in cserver->ctable; unknown options and options flagged
 * CONF_FIELD_FLAGS_NO_MODIFY are rejected. The value is split on single
 * spaces and wrapped in a conf_value (a string for zero or one field, an
 * array of strings for several) that is handed to the option's setter.
 *
 * Replies with shared.ok on success or with an error reply otherwise.
 */
static void configSetCommand(client *c) {
    int ret;
    sds value;
    sds *fields;
    int fields_count = 0;
    conf_option *opt;
    conf_value *cv;
    
    serverAssertWithInfo(c,c->argv[2],sdsEncodedObject(c->argv[2]));
    serverAssertWithInfo(c,c->argv[3],sdsEncodedObject(c->argv[3]));

    opt = dictFetchValue(cserver->ctable, c->argv[2]->ptr);

    if (opt == NULL) {
        addReplyErrorFormat(c,"Unsupported CONFIG parameter: %s",
            (char*)c->argv[2]->ptr);
        return;
    } else if (opt->flags&CONF_FIELD_FLAGS_NO_MODIFY) {
        addReplyErrorFormat(c,"Unsupported modify this CONFIG parameter: %s",
            (char*)c->argv[2]->ptr);
        return;
    }

    value = c->argv[3]->ptr;

    /* Handle some special action before setting the config value if needed */
    if (!strcasecmp(c->argv[2]->ptr,CONFIG_SOPN_MAXCLIENTS)) {
        long maxclients;
        int filelimit, threads;
        if (string2l(value,sdslen(value),&maxclients) == 0 || maxclients < 1) goto badfmt;
        conf_server_get(CONFIG_SOPN_THREADS,&threads);
        
        /* The request is accepted only if, after subtracting two descriptors
         * per thread and CONFIG_MIN_RESERVED_FDS, the limit returned by
         * adjustOpenFilesLimit() equals the requested number of clients. */
        filelimit = adjustOpenFilesLimit((int)maxclients);
        if ((filelimit-threads*2-CONFIG_MIN_RESERVED_FDS) != maxclients) {
            addReplyErrorFormat(c,"The operating system is not able to handle the specified number of clients");
            return;
        }
    } else if (!strcasecmp(c->argv[2]->ptr,CONFIG_SOPN_ADMINPASS)) {
        /* When an admin password is configured, changing it requires
         * c->authenticated to be at least 2. */
        if (c->vel->cc.adminpass && c->authenticated < 2) {
            addReplyErrorFormat(c,"You need adminpass to set this CONFIG parameter: %s",
                (char*)c->argv[2]->ptr);
            return;
        }
    }

    /* Build the conf_value handed to the setter. Ownership of each field
     * string moves from `fields` into the conf_value (the slot in `fields`
     * is set to NULL), so sdsfreesplitres() below does not free it again.
     * NOTE(review): the result of conf_value_create() is not checked for
     * NULL before it is dereferenced. */
    fields = sdssplitlen(value,sdslen(value)," ",1,&fields_count);
    if (fields == NULL) {
        goto badfmt;
    } else if (fields_count == 0) {
        cv = conf_value_create(CONF_VALUE_TYPE_STRING);
        cv->value = sdsempty();
    } else if (fields_count == 1) {
        cv = conf_value_create(CONF_VALUE_TYPE_STRING);
        cv->value = fields[0];
        fields[0] = NULL;
    } else if (fields_count > 1) {
        conf_value **cv_sub;
        uint32_t i;
    
        cv = conf_value_create(CONF_VALUE_TYPE_ARRAY);
        for (i = 0; i < fields_count; i ++) {
            cv_sub = darray_push(cv->value);
            *cv_sub = conf_value_create(CONF_VALUE_TYPE_STRING);
            (*cv_sub)->value = fields[i];
            fields[i] = NULL;
        }
    } else {
        /* Only reachable with a negative field count. */
        log_debug(LOG_NOTICE, "fields_count: %d", fields_count);
        serverPanic("Error config set value");
    }
    sdsfreesplitres(fields,fields_count);

    /* The conf_value is destroyed right after the setter returns, whatever
     * the result. */
    ret = opt->set(cserver, opt, cv);
    conf_value_destroy(cv);
    if (ret != VR_OK) {
        goto badfmt;
    }

    /* Handle some special action after setting the config value if needed */
    if (!strcmp(opt->name,CONFIG_SOPN_MAXMEMORY)) {
        long long maxmemory;
        conf_server_get(CONFIG_SOPN_MAXMEMORY,&maxmemory);
        if (maxmemory) {
            if (maxmemory < dalloc_used_memory()) {
                log_warn("WARNING: the new maxmemory value set via CONFIG SET is smaller than the current memory usage. This will result in keys eviction and/or inability to accept new write commands depending on the maxmemory-policy.");
                freeMemoryIfNeeded(c->vel);
            }
        }
    }

    /* On success we just return a generic OK for all the options. */
    addReply(c,shared.ok);
    return;

badfmt: /* Bad format errors */
    addReplyErrorFormat(c,"Invalid argument '%s' for CONFIG SET '%s'",
        (char*)value,
        (char*)c->argv[2]->ptr);
}

/*-----------------------------------------------------------------------------
 * CONFIG GET implementation
 *----------------------------------------------------------------------------*/

/*
 * Append one CONFIG GET result pair to the reply of client c: first the
 * option name as a bulk string, then its current value as a bulk string.
 * How the value is rendered depends on cop->type; an unknown type triggers
 * serverPanic().
 */
static void addReplyConfOption(client *c,conf_option *cop)
{
    addReplyBulkCString(c,cop->name);
    if (cop->type == CONF_FIELD_TYPE_INT) {
        int value;
        conf_server_get(cop->name,&value);
        
        /* The eviction policy is stored as an int but reported by name. */
        if (!strcmp(cop->name,CONFIG_SOPN_MAXMEMORYP)) {
            addReplyBulkCString(c,get_evictpolicy_strings(value));
        } else {
            addReplyBulkLongLong(c,value);
        }
    } else if (cop->type == CONF_FIELD_TYPE_LONGLONG) {
        long long value;
        conf_server_get(cop->name,&value);
        addReplyBulkLongLong(c,value);
    } else if (cop->type == CONF_FIELD_TYPE_SDS) {
        /* An unset (NULL) string option is reported as an empty string.
         * NOTE(review): `value` is not freed here; presumably
         * addReplyBulkSds() takes ownership of it - confirm. */
        sds value;
        conf_server_get(cop->name,&value);
        if (value == NULL) {
            addReplyBulkCString(c,"");
        } else {
            addReplyBulkSds(c,value);
        }
    } else if (cop->type == CONF_FIELD_TYPE_ARRAYSDS) {
        /* Array options are reported as one space-separated string. */
        struct darray values;
        sds value = sdsempty();
        sds *elem;

        darray_init(&values,1,sizeof(sds));
        conf_server_get(cop->name,&values);
        /* NOTE(review): elements are taken with darray_pop(); if that pops
         * from the tail, the reported order is the reverse of the stored
         * order - confirm against darray. */
        while(darray_n(&values) > 0) {
            elem = darray_pop(&values);
            value = sdscatsds(value,*elem);
            value = sdscat(value," ");
            sdsfree(*elem);
        }
        darray_deinit(&values);
        /* Drop the trailing separator appended after the last element. */
        if (sdslen(value) > 0) sdsrange(value,0,-2);
        addReplyBulkSds(c,value);
    } else {
        serverPanic("Error conf field type");
    }
}

/*
 * CONFIG GET <pattern>
 *
 * If the argument is the exact name of an option, reply with that single
 * name/value pair. Otherwise treat it as a glob pattern and reply with the
 * pair of every option whose name matches.
 *
 * The adminpass option is hidden when an admin password is configured and
 * c->authenticated is below 2: an exact request gets shared.noadminerr,
 * and a pattern request silently skips it.
 */
static void configGetCommand(client *c) {
    robj *arg = c->argv[2];
    char *pattern = arg->ptr;
    conf_option *option;
    void *deferred_len;
    int matched = 0;

    serverAssertWithInfo(c,arg,sdsEncodedObject(arg));

    option = dictFetchValue(cserver->ctable, pattern);
    if (option != NULL) {
        /* Exact option name. */
        /* Don't show adminpass if user has no right. */
        if (strcmp(option->name,CONFIG_SOPN_ADMINPASS) == 0 &&
            c->vel->cc.adminpass && c->authenticated < 2) {
            addReply(c,shared.noadminerr);
            return;
        }

        addReplyMultiBulkLen(c,2);
        addReplyConfOption(c,option);
        return;
    }

    /* Glob pattern: the reply length is only known after the scan. */
    deferred_len = addDeferredMultiBulkLength(c);
    for (option = conf_server_options; option&&option->name; option++) {
        if (!stringmatch(pattern,option->name,1)) {
            continue;
        }

        /* Don't show adminpass if user has no right. */
        if (strcmp(option->name,CONFIG_SOPN_ADMINPASS) == 0 &&
            c->vel->cc.adminpass && c->authenticated < 2) {
            continue;
        }

        addReplyConfOption(c,option);
        matched ++;
    }
    setDeferredMultiBulkLength(c,deferred_len,matched*2);
}

/*-----------------------------------------------------------------------------
 * CONFIG REWRITE implementation
 *----------------------------------------------------------------------------*/

/* The config rewrite state: an in-memory copy of the configuration file,
 * one sds per line, plus the bookkeeping needed to rewrite it. */
struct rewriteConfigState {
    dict *option_to_line; /* Option -> list of config file lines map
                             (the list holds zero-based line numbers) */
    dict *rewritten;      /* Dictionary of already processed options */
    int numlines;         /* Number of lines in current config */
    sds *lines;           /* Current lines as an array of sds strings */
    int has_tail;         /* True if we already added directives that were
                             not present in the original config file. */
};

/* Grow the array of lines held by the rewrite state by one slot and store
 * `line` in it. The state keeps the sds it is given (no copy is made). */
static void rewriteConfigAppendLine(struct rewriteConfigState *state, sds line) {
    int slot = state->numlines;

    state->lines = drealloc(state->lines, sizeof(char*) * (slot+1));
    state->lines[slot] = line;
    state->numlines = slot + 1;
}

/* Record that `option` appears at line `linenum` of the old config file.
 * The list of line numbers for the option is created on first use, keyed
 * by a duplicate of the option name; line numbers are stored directly in
 * the list node value pointer. */
static void rewriteConfigAddLineNumberToOption(struct rewriteConfigState *state, sds option, int linenum) {
    dlist *line_numbers = dictFetchValue(state->option_to_line,option);

    if (!line_numbers) {
        line_numbers = dlistCreate();
        dictAdd(state->option_to_line,sdsdup(option),line_numbers);
    }

    dlistAddNodeTail(line_numbers,(void*)(long)linenum);
}

/* Dict type for rewriteConfigState.option_to_line: case-insensitive sds
 * keys; values are released with dictListDestructor. */
dictType optionToLineDictType = {
    dictSdsCaseHash,            /* hash function */
    NULL,                       /* key dup */
    NULL,                       /* val dup */
    dictSdsKeyCaseCompare,      /* key compare */
    dictSdsDestructor,          /* key destructor */
    dictListDestructor          /* val destructor */
};

/* Dict type for rewriteConfigState.rewritten: a set of case-insensitive
 * sds keys; no value destructor is registered. */
dictType optionSetDictType = {
    dictSdsCaseHash,            /* hash function */
    NULL,                       /* key dup */
    NULL,                       /* val dup */
    dictSdsKeyCaseCompare,      /* key compare */
    dictSdsDestructor,          /* key destructor */
    NULL                        /* val destructor */
};

/* Size (excluding the terminating NUL) of the buffer used to read one line
 * of the old config file during CONFIG REWRITE. */
#define CONFIG_MAX_LINE    1024
/* Comment line marking the start of the section appended by CONFIG REWRITE. */
#define REDIS_CONFIG_REWRITE_SIGNATURE "# Generated by CONFIG REWRITE"
/* Read the old file, split it into lines to populate a newly created
 * config rewrite state, and return it to the caller.
 *
 * If it is impossible to read the old file (or to allocate the state),
 * NULL is returned.
 * If the old file does not exist at all, an empty state is returned.
 *
 * The fopen() failure is evaluated before anything is allocated, so the
 * error return neither leaks the state nor tests an errno value that an
 * allocation could have overwritten. */
static struct rewriteConfigState *rewriteConfigReadOldFile(char *path) {
    FILE *fp = fopen(path,"r");
    struct rewriteConfigState *state;
    char buf[CONFIG_MAX_LINE+1];
    int linenum = -1;

    if (fp == NULL && errno != ENOENT) return NULL;

    state = dalloc(sizeof(*state));
    if (state == NULL) {
        if (fp != NULL) fclose(fp);
        return NULL;
    }

    state->option_to_line = dictCreate(&optionToLineDictType,NULL);
    state->rewritten = dictCreate(&optionSetDictType,NULL);
    state->numlines = 0;
    state->lines = NULL;
    state->has_tail = 0;
    if (fp == NULL) return state;

    /* Read the old file line by line, populate the state. */
    while(fgets(buf,CONFIG_MAX_LINE+1,fp) != NULL) {
        int argc;
        sds *argv;
        sds line = sdstrim(sdsnew(buf),"\r\n\t ");

        linenum++; /* Zero based, so we init at -1 */

        /* Handle comments and empty lines. */
        if (line[0] == '#' || line[0] == '\0') {
            if (!state->has_tail && !strcmp(line,REDIS_CONFIG_REWRITE_SIGNATURE))
                state->has_tail = 1;
            rewriteConfigAppendLine(state,line);
            continue;
        }

        /* Not a comment, split into arguments. */
        argv = sdssplitargs(line,&argc);
        if (argv == NULL) {
            /* Apparently the line is unparsable for some reason, for
             * instance it may have unbalanced quotes. Load it as a
             * comment. */
            sds aux = sdsnew("# ??? ");
            aux = sdscatsds(aux,line);
            sdsfree(line);
            rewriteConfigAppendLine(state,aux);
            continue;
        }

        if (argc == 0) {
            /* No directive on this line (argv[0] does not exist): keep the
             * line as it is, without registering any option for it. */
            rewriteConfigAppendLine(state,line);
            sdsfreesplitres(argv,argc);
            continue;
        }

        sdstolower(argv[0]); /* We only want lowercase config directives. */

        /* Now we populate the state according to the content of this line.
         * Append the line and populate the option -> line numbers map. */
        rewriteConfigAppendLine(state,line);
        rewriteConfigAddLineNumberToOption(state,argv[0],linenum);

        sdsfreesplitres(argv,argc);
    }
    fclose(fp);
    return state;
}

/* Remember that `option` has been handled by the rewrite process.
 *
 * Only lines belonging to handled options may later be blanked in the
 * config file; options the rewrite process does not know about are left
 * untouched. Marking the same option twice is harmless: the duplicate key
 * is simply freed. */
static void rewriteConfigMarkAsProcessed(struct rewriteConfigState *state, const char *option) {
    sds name = sdsnew(option);
    int added = dictAdd(state->rewritten,name,NULL);

    if (added != DICT_OK) {
        sdsfree(name);
    }
}

/* Emit the new "line" for the configuration option "option".
 *
 * Lines that the old file already used for the same option are recycled one
 * at a time: the first still-unused line number is taken out of the
 * option -> line numbers map and its content is replaced with "line".
 *
 * If there are no lines left for the option and "force" is non-zero, the
 * line is appended at the end of the configuration. "force" is usually true
 * when the option does not hold its default value and so must be written
 * even if the old file never mentioned it.
 *
 * The first time a line is appended, the CONFIG REWRITE signature comment is
 * appended before it to mark the start of the generated section.
 *
 * "line" is always consumed: it is either stored in the state or freed, so
 * the caller must not free it. */
static void rewriteConfigRewriteLine(struct rewriteConfigState *state, const char *option, sds line, int force) {
    sds key = sdsnew(option);
    dlist *old_lines = dictFetchValue(state->option_to_line,key);

    rewriteConfigMarkAsProcessed(state,option);

    if (old_lines != NULL) {
        /* Reuse the first old line that still belongs to this option. */
        dlistNode *first = dlistFirst(old_lines);
        int idx = (long) first->value;

        dlistDelNode(old_lines,first);
        if (dlistLength(old_lines) == 0) {
            dictDelete(state->option_to_line,key);
        }
        sdsfree(state->lines[idx]);
        state->lines[idx] = line;
    } else if (force) {
        /* Nothing to reuse: append, preceded by the signature if this is
         * the first appended line. */
        if (!state->has_tail) {
            rewriteConfigAppendLine(state,
                sdsnew(REDIS_CONFIG_REWRITE_SIGNATURE));
            state->has_tail = 1;
        }
        rewriteConfigAppendLine(state,line);
    } else {
        /* Option never used before and we are not forced to write it. */
        sdsfree(line);
    }

    sdsfree(key);
}

/* Dispose of a configuration rewrite state: both dictionaries, the array
 * of lines, and finally the state structure itself. */
static void rewriteConfigReleaseState(struct rewriteConfigState *state) {
    /* The two dictionaries and the lines array are released independently
     * of each other. */
    dictRelease(state->option_to_line);
    dictRelease(state->rewritten);
    sdsfreesplitres(state->lines,state->numlines);

    dfree(state);
}

/* Blank the lines of the old file that no longer serve any purpose.
 *
 * Once every option has been rewritten, the option -> line numbers map only
 * holds the lines that rewriteConfigRewriteLine() did not reuse. For the
 * options that were processed, those leftovers are "orphaned" and get
 * replaced by empty lines. Options that were never processed are left
 * alone. */
static void rewriteConfigRemoveOrphaned(struct rewriteConfigState *state) {
    dictIterator *iter = dictGetIterator(state->option_to_line);
    dictEntry *entry;

    for (entry = dictNext(iter); entry != NULL; entry = dictNext(iter)) {
        dlist *leftover = dictGetVal(entry);
        sds name = dictGetKey(entry);

        /* Options unknown to the rewrite process keep their lines. */
        if (dictFind(state->rewritten,name) == NULL) {
            log_debug(LOG_DEBUG,"Not rewritten option: %s", name);
            continue;
        }

        /* Drain the list, emptying each line it still points to. */
        while (dlistLength(leftover) != 0) {
            dlistNode *node = dlistFirst(leftover);
            int idx = (long) node->value;

            sdsfree(state->lines[idx]);
            state->lines[idx] = sdsempty();
            dlistDelNode(leftover,node);
        }
    }
    dictReleaseIterator(iter);
}

/* Build the text of the new configuration file by joining every line of
 * the rewrite state with a trailing newline. Consecutive empty lines are
 * collapsed into a single empty line. Returns a newly created sds string. */
static sds rewriteConfigGetContentFromState(struct rewriteConfigState *state) {
    sds out = sdsempty();
    int prev_blank = 0;
    int i;

    for (i = 0; i < state->numlines; i++) {
        sds cur = state->lines[i];
        int blank = (sdslen(cur) == 0);

        /* Only the first line of a run of empty lines is emitted. */
        if (blank && prev_blank) continue;
        prev_blank = blank;

        out = sdscatsds(out,cur);
        out = sdscatlen(out,"\n",1);
    }
    return out;
}

/* This function overwrites the old configuration file with the new content.
 *
 * 1) The old file length is obtained.
 * 2) If the new content is smaller, padding is added.
 * 3) A single write(2) call is used to replace the content of the file.
 * 4) Later the file is truncated to the length of the new content.
 *
 * The padding is a newline followed by '#' characters, so that until the
 * final truncation the tail of the file is a comment line.
 *
 * A write(2) that stores fewer bytes than requested is reported as an
 * error (errno is set to EIO) and the file is not truncated.
 *
 * The function returns 0 on success, otherwise -1 is returned and errno
 * set accordingly: errno is preserved across the cleanup performed before
 * returning. */
static int rewriteConfigOverwriteFile(char *configfile, sds content) {
    int retval = 0;
    int saved_errno;
    int fd;
    size_t content_size = sdslen(content);
    size_t padding = 0;
    size_t total;
    ssize_t written;
    struct stat sb;
    sds content_padded;

    /* 1) Open the old file (or create a new one if it does not
     *    exist), get the size. */
    fd = open(configfile,O_RDWR|O_CREAT,0644);
    if (fd == -1) return -1; /* errno set by open(). */
    if (fstat(fd,&sb) == -1) {
        saved_errno = errno; /* close() may overwrite errno. */
        close(fd);
        errno = saved_errno;
        return -1;
    }

    /* 2) Pad the content to at least match the old file size. */
    content_padded = sdsdup(content);
    if (sb.st_size > 0 && content_size < (size_t)sb.st_size) {
        /* If the old file was bigger, pad the content with
         * a newline plus as many "#" chars as required. */
        padding = (size_t)sb.st_size - content_size;
        content_padded = sdsgrowzero(content_padded,(size_t)sb.st_size);
        content_padded[content_size] = '\n';
        memset(content_padded+content_size+1,'#',padding-1);
    }

    /* 3) Write the new content using a single write(2). */
    total = sdslen(content_padded);
    written = write(fd,content_padded,total);
    if (written == -1) {
        retval = -1; /* errno set by write(). */
        goto cleanup;
    }
    if ((size_t)written != total) {
        /* Short write: the file now holds only part of the new content. */
        errno = EIO;
        retval = -1;
        goto cleanup;
    }

    /* 4) Truncate the file to the right length if we used padding. */
    if (padding) {
        if (ftruncate(fd,(off_t)content_size) == -1) {
            /* Non critical error: the file just keeps its commented
             * padding at the end. */
        }
    }

cleanup:
    saved_errno = errno;
    sdsfree(content_padded);
    close(fd);
    if (retval == -1) errno = saved_errno;
    return retval;
}

/* Rewrite an option whose value is an int, as "<option> <value>".
 * The line is forced into the file when the current value differs from
 * 'defvalue'. */
static void rewriteConfigIntOption(struct rewriteConfigState *state, char *option, int defvalue) {
    int current;
    sds newline;

    conf_server_get(option,&current);
    newline = sdscatprintf(sdsempty(),"%s %d",option,current);

    rewriteConfigRewriteLine(state,option,newline,current != defvalue);
}

/* Rewrite an option whose value is an sds string, as "<option> <value>",
 * or as <option> "" when the value is NULL.
 *
 * The line is forced into the file unless the current value matches
 * 'defvalue' (both NULL, or both set and equal). The value obtained from
 * conf_server_get() is freed here. */
static void rewriteConfigSdsOption(struct rewriteConfigState *state, char *option, sds defvalue) {
    sds current;
    sds newline;
    int force = 1;

    conf_server_get(option,&current);

    if (current == NULL) {
        if (defvalue == NULL) force = 0;
    } else if (defvalue != NULL && sdscmp(current,defvalue) == 0) {
        force = 0;
    }

    if (current != NULL) {
        newline = sdscatprintf(sdsempty(),"%s %s",option,current);
        sdsfree(current);
    } else {
        newline = sdscatprintf(sdsempty(),"%s \"\"",option);
    }

    rewriteConfigRewriteLine(state,option,newline,force);
}

/* Rewrite an option whose value is a long long, as "<option> <value>".
 * The line is forced into the file when the current value differs from
 * 'defvalue'. */
static void rewriteConfigLongLongOption(struct rewriteConfigState *state, char *option, long long defvalue) {
    long long current;
    sds newline;

    conf_server_get(option,&current);
    newline = sdscatprintf(sdsempty(),"%s %lld",option,current);

    rewriteConfigRewriteLine(state,option,newline,current != defvalue);
}

/* Format 'bytes' into 'buf' (at most 'len' bytes, as with snprintf) in a
 * form that can be parsed back from the configuration file. A non-zero
 * value that is an exact multiple of 1024^3, 1024^2 or 1024 is written with
 * the largest matching "gb", "mb" or "kb" suffix; anything else is written
 * as a plain number. Returns what snprintf() returns. */
static int rewriteConfigFormatMemory(char *buf, size_t len, long long bytes) {
    const long long kb = 1024;
    const long long mb = kb*1024;
    const long long gb = mb*1024;
    const char *suffix = "";
    long long amount = bytes;

    if (bytes != 0) {
        /* Try the units from the largest to the smallest. */
        if (bytes % gb == 0) {
            amount = bytes/gb;
            suffix = "gb";
        } else if (bytes % mb == 0) {
            amount = bytes/mb;
            suffix = "mb";
        } else if (bytes % kb == 0) {
            amount = bytes/kb;
            suffix = "kb";
        }
    }

    return snprintf(buf,len,"%lld%s",amount,suffix);
}

/* Rewrite an "option-name <bytes>" configuration option. The value is
 * rendered through rewriteConfigFormatMemory() and the line is forced into
 * the file when the current value differs from 'defvalue'. */
static void rewriteConfigBytesOption(struct rewriteConfigState *state, char *option, long long defvalue) {
    char formatted[64];
    long long current;
    sds newline;

    conf_server_get(option,&current);

    rewriteConfigFormatMemory(formatted,sizeof(formatted),current);
    newline = sdscatprintf(sdsempty(),"%s %s",option,formatted);

    rewriteConfigRewriteLine(state,option,newline,current != defvalue);
}

/* Rewrite an enumeration option as "<option> <name>". Besides the state and
 * the option name it takes 'fun', which maps the integer value of the option
 * to its printable name, and 'defval', the default value: the line is forced
 * into the file when the current value differs from it. */
static void rewriteConfigEnumOption(struct rewriteConfigState *state, char *option, configEnumGetStrFun fun, int defval) {
    int current;
    const char *label;
    sds newline;

    conf_server_get(option,&current);
    label = fun(current);
    newline = sdscatprintf(sdsempty(),"%s %s",option,label);

    rewriteConfigRewriteLine(state,option,newline,current != defval);
}

/* Rewrite the bind option. */
static void rewriteConfigBindOption(struct rewriteConfigState *state) {
    struct darray values;
    sds *value, line;
    int force = 1;
    char *option = CONFIG_SOPN_BIND;

    darray_init(&values,1,sizeof(sds));
    conf_server_get(option,&values);
    /* Nothing to rewrite if we don't have bind addresses. */
    if (darray_n(&values) == 0) {
        darray_deinit(&values);
        rewriteConfigMarkAsProcessed(state,option);
        return;
    }

    /* Rewrite as bind <addr1> <addr2> ... <addrN> */
    line = sdsnew(option);
    while(darray_n(&values) > 0) {
        line = sdscat(line," ");
        value = darray_pop(&values);
        line = sdscatsds(line,*value);
        sdsfree(*value);
    }
    darray_deinit(&values);

    rewriteConfigRewriteLine(state,option,line,force);
}

/* Rewrite the save option. */
void rewriteConfigCommandsNAPOption(struct rewriteConfigState *state) {
    struct darray values;
    sds *value, line;
    int force = 1;
    char *option = CONFIG_SOPN_COMMANDSNAP;

    darray_init(&values,1,sizeof(sds));
    conf_server_get(option,&values);
    /* Nothing to rewrite if we don't have commands that need adminpass. */
    if (darray_n(&values) == 0) {
        darray_deinit(&values);
        rewriteConfigMarkAsProcessed(state,option);
        return;
    }

    while(darray_n(&values) > 0) {
        value = darray_pop(&values);
        line = sdscatprintf(sdsempty(),"%s %s",option,*value);
        rewriteConfigRewriteLine(state,option,line,force);
        sdsfree(*value);
    }
    darray_deinit(&values);
    rewriteConfigMarkAsProcessed(state,option);
}

/* Rewrite the configuration file at "path".
 * If the configuration file already exists, we try at best to retain comments
 * and overall structure.
 *
 * Configuration parameters that are at their default value, unless already
 * explicitly included in the old configuration file, are not rewritten.
 *
 * The same "path" is used both to read the old file and to write the new
 * one. The whole operation runs with the config file lock held.
 *
 * On error -1 is returned and errno is set accordingly, otherwise 0. errno
 * is saved right after the failing step so that unlocking and releasing
 * memory cannot overwrite the value the caller reports. */
static int rewriteConfig(char *path) {
    struct rewriteConfigState *state;
    sds newcontent;
    int retval;
    int saved_errno;

    CONFF_LOCK();
    /* Step 1: read the old config into our rewrite state. */
    if ((state = rewriteConfigReadOldFile(path)) == NULL) {
        saved_errno = errno;
        CONFF_UNLOCK();
        errno = saved_errno;
        return -1;
    }

    /* Step 2: rewrite every single option, replacing or appending it inside
     * the rewrite state. */
    rewriteConfigIntOption(state,CONFIG_SOPN_DATABASES,CONFIG_DEFAULT_LOGICAL_DBNUM);
    rewriteConfigIntOption(state,CONFIG_SOPN_IDPDATABASE,CONFIG_DEFAULT_INTERNAL_DBNUM);
    rewriteConfigBytesOption(state,CONFIG_SOPN_MAXMEMORY,CONFIG_DEFAULT_MAXMEMORY);
    rewriteConfigEnumOption(state,CONFIG_SOPN_MAXMEMORYP,get_evictpolicy_strings,CONFIG_DEFAULT_MAXMEMORY_POLICY);
    rewriteConfigIntOption(state,CONFIG_SOPN_MAXMEMORYS,CONFIG_DEFAULT_MAXMEMORY_SAMPLES);
    rewriteConfigLongLongOption(state,CONFIG_SOPN_MTCLIMIT,CONFIG_DEFAULT_MAX_TIME_COMPLEXITY_LIMIT);
    rewriteConfigBindOption(state);
    rewriteConfigIntOption(state,CONFIG_SOPN_PORT,CONFIG_DEFAULT_SERVER_PORT);
    rewriteConfigIntOption(state,CONFIG_SOPN_THREADS,CONFIG_DEFAULT_THREADS_NUM);
    rewriteConfigLongLongOption(state,CONFIG_SOPN_SLOWLOGLST,CONFIG_DEFAULT_SLOWLOG_LOG_SLOWER_THAN);
    rewriteConfigIntOption(state,CONFIG_SOPN_SLOWLOGML,CONFIG_DEFAULT_SLOWLOG_MAX_LEN);
    rewriteConfigIntOption(state,CONFIG_SOPN_MAXCLIENTS,CONFIG_DEFAULT_MAX_CLIENTS);
    rewriteConfigSdsOption(state,CONFIG_SOPN_REQUIREPASS,NULL);
    rewriteConfigSdsOption(state,CONFIG_SOPN_ADMINPASS,NULL);
    rewriteConfigCommandsNAPOption(state);

    /* Step 3: remove all the orphaned lines in the old file, that is, lines
     * that were used by a config option and are no longer used, like in case
     * of duplicated options or options that may appear on several lines. */
    rewriteConfigRemoveOrphaned(state);

    /* Step 4: generate a new configuration file from the modified state
     * and write it back to the file it was read from. */
    newcontent = rewriteConfigGetContentFromState(state);
    retval = rewriteConfigOverwriteFile(path,newcontent);
    saved_errno = errno;
    CONFF_UNLOCK();

    sdsfree(newcontent);
    rewriteConfigReleaseState(state);
    if (retval == -1) errno = saved_errno;
    return retval;
}

/*-----------------------------------------------------------------------------
 * CONFIG command entry point
 *----------------------------------------------------------------------------*/

/* Dispatch the CONFIG command on its subcommand, c->argv[1]:
 *
 *   CONFIG SET <option> <value>   (4 arguments)
 *   CONFIG GET <pattern>          (3 arguments)
 *   CONFIG REWRITE                (2 arguments)
 *
 * While the server is loading only GET is accepted. A wrong number of
 * arguments or an unknown subcommand is answered with an error reply.
 * The RESETSTAT subcommand is not handled here. */
void configCommand(client *c) {
    const char *sub = c->argv[1]->ptr;
    int is_get = (strcasecmp(sub,"get") == 0);

    /* Only allow CONFIG GET while loading. */
    if (server.loading && !is_get) {
        addReplyError(c,"Only CONFIG GET is allowed during loading");
        return;
    }

    if (strcasecmp(sub,"set") == 0) {
        if (c->argc != 4) goto badarity;
        configSetCommand(c);
        return;
    }

    if (is_get) {
        if (c->argc != 3) goto badarity;
        configGetCommand(c);
        return;
    }

    if (strcasecmp(sub,"rewrite") == 0) {
        if (c->argc != 2) goto badarity;
        if (server.configfile == NULL) {
            addReplyError(c,"The server is running without a config file");
            return;
        }
        if (rewriteConfig(server.configfile) != -1) {
            log_warn("CONFIG REWRITE executed with success.");
            addReply(c,shared.ok);
        } else {
            log_warn("CONFIG REWRITE failed: %s", strerror(errno));
            addReplyErrorFormat(c,"Rewriting config file: %s", strerror(errno));
        }
        return;
    }

    addReplyError(c,
        "CONFIG subcommand must be GET, SET, REWRITE");
    return;

badarity:
    addReplyErrorFormat(c,"Wrong number of arguments for CONFIG %s",
        (char*) c->argv[1]->ptr);
}

/* Initialise a conf cache: the cached version is set to 0 and every cached
 * field is loaded from the server configuration via conf_server_get().
 * Always returns VR_OK. */
int
conf_cache_init(conf_cache *cc)
{
    cc->cache_version = 0;

    /* Client limit. */
    conf_server_get(CONFIG_SOPN_MAXCLIENTS, &cc->maxclients);

    /* Passwords. */
    conf_server_get(CONFIG_SOPN_REQUIREPASS, &cc->requirepass);
    conf_server_get(CONFIG_SOPN_ADMINPASS, &cc->adminpass);

    /* Memory, time complexity and slowlog limits. */
    conf_server_get(CONFIG_SOPN_MAXMEMORY, &cc->maxmemory);
    conf_server_get(CONFIG_SOPN_MTCLIMIT, &cc->max_time_complexity_limit);
    conf_server_get(CONFIG_SOPN_SLOWLOGLST, &cc->slowlog_log_slower_than);

    return VR_OK;
}

/* Reset a conf cache: the cached version goes back to 0 and the two cached
 * password strings are freed and set to NULL. Always returns VR_OK. */
int
conf_cache_deinit(conf_cache *cc)
{
    sds *passwords[2];
    int i;

    cc->cache_version = 0;

    passwords[0] = &cc->requirepass;
    passwords[1] = &cc->adminpass;
    for (i = 0; i < 2; i++) {
        if (*passwords[i] == NULL) {
            continue;
        }
        sdsfree(*passwords[i]);
        *passwords[i] = NULL;
    }

    return VR_OK;
}

/* Refresh a conf cache when the configuration version has moved on.
 *
 * If the version returned by conf_version_get() is not greater than the
 * cached one, nothing is done. Otherwise the cached password strings are
 * freed, every cached field is fetched again with conf_server_get(), and
 * the cached version is updated.
 *
 * Always returns VR_OK. */
int
conf_cache_update(conf_cache *cc)
{
    unsigned long long cversion = conf_version_get();

    /* The cache is already up to date: no refresh needed. */
    if (cversion <= cc->cache_version) {
        return VR_OK;
    }

    /* Drop the old password strings before fetching the new ones. */
    if (cc->requirepass != NULL) {
        sdsfree(cc->requirepass);
        cc->requirepass = NULL;
    }
    if (cc->adminpass != NULL) {
        sdsfree(cc->adminpass);
        cc->adminpass = NULL;
    }

    conf_server_get(CONFIG_SOPN_MAXCLIENTS,&cc->maxclients);
    conf_server_get(CONFIG_SOPN_REQUIREPASS,&cc->requirepass);
    conf_server_get(CONFIG_SOPN_ADMINPASS,&cc->adminpass);
    conf_server_get(CONFIG_SOPN_MAXMEMORY,&cc->maxmemory);
    conf_server_get(CONFIG_SOPN_MTCLIMIT,&cc->max_time_complexity_limit);
    conf_server_get(CONFIG_SOPN_SLOWLOGLST,&cc->slowlog_log_slower_than);

    cc->cache_version = cversion;

    return VR_OK;
}


================================================
FILE: src/vr_conf.h
================================================
#ifndef _VR_CONF_H_
#define _VR_CONF_H_

/* Config server option names: the strings passed as option name to
 * conf_server_get() / conf_server_set(), and written as the first word of
 * a line when the config file is rewritten. */
#define CONFIG_SOPN_DATABASES    "databases"
#define CONFIG_SOPN_IDPDATABASE  "internal-dbs-per-databases"
#define CONFIG_SOPN_MAXMEMORY    "maxmemory"
#define CONFIG_SOPN_MAXMEMORYP   "maxmemory-policy"
#define CONFIG_SOPN_MAXMEMORYS   "maxmemory-samples"
#define CONFIG_SOPN_MTCLIMIT     "max-time-complexity-limit"
#define CONFIG_SOPN_BIND         "bind"
#define CONFIG_SOPN_PORT         "port"
#define CONFIG_SOPN_THREADS      "threads"
#define CONFIG_SOPN_DIR          "dir"
#define CONFIG_SOPN_MAXCLIENTS   "maxclients"
#define CONFIG_SOPN_SLOWLOGLST   "slowlog-log-slower-than"
#define CONFIG_SOPN_SLOWLOGML    "slowlog-max-len"
#define CONFIG_SOPN_REQUIREPASS  "requirepass"
#define CONFIG_SOPN_ADMINPASS    "adminpass"
#define CONFIG_SOPN_COMMANDSNAP  "commands-need-adminpass"

/* NOTE(review): neither of the two macros below is referenced in the part
 * of the sources visible here; confirm their users before changing them. */
#define CONFIG_RUN_ID_SIZE 40
#define CONFIG_DEFAULT_ACTIVE_REHASHING 1

/* Default values of the "databases" and "internal-dbs-per-databases"
 * options. */
#define CONFIG_DEFAULT_LOGICAL_DBNUM    6
#define CONFIG_DEFAULT_INTERNAL_DBNUM   6

/* Default values of the "maxmemory", "maxmemory-samples" and "maxclients"
 * options. */
#define CONFIG_DEFAULT_MAXMEMORY 0
#define CONFIG_DEFAULT_MAXMEMORY_SAMPLES 5
#define CONFIG_DEFAULT_MAX_CLIENTS 10000

#define CONFIG_DEFAULT_THREADS_NUM (sysconf(_SC_NPROCESSORS_ONLN)>6?6:sysconf(_SC_NPROCESSORS_ONLN))

#define CONFIG_DEFAULT_HOST "0.0.0.0"

#define CONFIG_DEFAULT_SERVER_PORT 55555

#define CONFIG_DEFAULT_DATA_DIR "viredata"

#define CONFIG_DEFAULT_MAX_TIME_COMPLEXITY_LIMIT 0 /* Not limited */

#define CONFIG_DEFAULT_SLOWLOG_LOG_SLOWER_THAN 10000
#define CONFIG_DEFAULT_SLOWLOG_MAX_LEN 128

#define CONFIG_AUTHPASS_MAX_LEN 512

#define CONFIG_BINDADDR_MAX 16

#define CONF_UNSET_NUM      -1
#define CONF_UNSET_PTR      NULL
#define CONF_UNSET_GROUP    (group_type_t) -1
#define CONF_UNSET_HASH     (hash_type_t) -1
#define CONF_UNSET_DIST     (dist_type_t) -1

/* Config field data type for conf_option struct */
#define CONF_FIELD_TYPE_INT         0
#define CONF_FIELD_TYPE_LONGLONG    1
#define CONF_FIELD_TYPE_SDS         2
#define CONF_FIELD_TYPE_ARRAYSDS    3

/* Config field flags for conf_option struct */
#define CONF_FIELD_FLAGS_NO_MODIFY  (1<<0)

/* Descriptor of a single configuration option: its name, its value type
 * (one of the CONF_FIELD_TYPE_* constants) and flags (CONF_FIELD_FLAGS_*),
 * the callbacks used to store and fetch its value, and the offset of the
 * matching field inside the struct that holds the option values. */
typedef struct conf_option {
    char    *name;      /* option name */
    int     type;       /* value type */
    int     flags;      /* option flags */
    int     (*set)(void *cf, struct conf_option *opt, void *data);
    int     (*get)(void *cf, struct conf_option *opt, void *data);
    int     offset;     /* offset of this option field in the struct  */
}conf_option;

/* X-macro listing every eviction policy as a (constant, name) pair.
 * ACTION is applied to each pair; below it is used to generate the enum
 * constants. NOTE: the last entry ends with a line continuation, so the
 * blank line that follows it is still part of the macro definition. */
#define EVICTPOLICY_CODEC(ACTION)                           \
    ACTION( MAXMEMORY_VOLATILE_LRU,     volatile-lru)       \
    ACTION( MAXMEMORY_VOLATILE_RANDOM,  volatile-random)    \
    ACTION( MAXMEMORY_VOLATILE_TTL,     volatile-ttl)       \
    ACTION( MAXMEMORY_ALLKEYS_LRU,      allkeys-lru)        \
    ACTION( MAXMEMORY_ALLKEYS_RANDOM,   allkeys-random)     \
    ACTION( MAXMEMORY_NO_EVICTION,      noeviction)         \

/* Eviction policy constants, generated from EVICTPOLICY_CODEC in listing
 * order. EVICTPOLICY_SENTINEL comes last and so equals the number of
 * policies. */
#define DEFINE_ACTION(_policy, _name) _policy,
typedef enum evictpolicy_type {
    EVICTPOLICY_CODEC( DEFINE_ACTION )
    EVICTPOLICY_SENTINEL
} evictpolicy_type_t;
#undef DEFINE_ACTION

/* Values of the server configuration options. Each field matches one of
 * the CONFIG_SOPN_* option names. */
typedef struct conf_server {
    dict          *ctable;              /* NOTE(review): presumably the option table; confirm in vr_conf.c */

    int           databases;
    int           internal_dbs_per_databases;

    /* Limits */
    long long     max_time_complexity_limit;
    long long     maxmemory;            /* Max number of memory bytes to use */
    int           maxmemory_policy;     /* Policy for key eviction */
    int           maxmemory_samples;    /* Precision of random sampling */
    int           maxclients;           /* Max number of simultaneous clients */

    int           threads;

    struct darray  binds;                /* Type: sds */
    int           port;

    sds           dir;

    long long     slowlog_log_slower_than;  /* SLOWLOG time limit (to get logged) */
    int           slowlog_max_len;      /* SLOWLOG max number of items logged */

    sds           requirepass;          /* Pass for AUTH command, or NULL */
    sds           adminpass;            /* Pass for ADMIN command, or NULL */
    struct darray  commands_need_adminpass; /* Type: sds */
} conf_server;

/* Top-level configuration object: the config file name, the server option
 * values, a version counter and the locks protecting the configuration and
 * the config file. */
typedef struct vr_conf {
    sds           fname;             /* file name , absolute path */

    dict          *organizations;    /* organizations */

    conf_server   cserver;           /* server option values */

    unsigned long long version;      /* config version */
    pthread_rwlock_t rwl;            /* config read write lock */
    pthread_mutex_t flock;           /* config file lock */
}vr_conf;

/* Kinds of value a conf_value can carry (stored in conf_value.type). */
#define CONF_VALUE_TYPE_UNKNOW   0
#define CONF_VALUE_TYPE_STRING   1
#define CONF_VALUE_TYPE_ARRAY    2

/* A configuration value tagged with its kind. 'value' is an untyped
 * pointer whose interpretation depends on 'type'. */
typedef struct conf_value{
    int     type;       /* one of CONF_VALUE_TYPE_* */
    void    *value;
}conf_value;

/* Some config options are read many times on every loop,
 * so a copy of them is cached here. conf_cache_update() refreshes the copy
 * when the config version is newer than 'cache_version'. */
typedef struct conf_cache {
    unsigned long long cache_version;   /* config version of the cached values */

    int maxclients;
    sds requirepass;                    /* freed by conf_cache_deinit() */
    sds adminpass;                      /* freed by conf_cache_deinit() */
    long long maxmemory;
    long long max_time_complexity_limit;
    long long slowlog_log_slower_than;
}conf_cache;

/* Global configuration objects, defined outside this header. */
extern vr_conf *conf;
extern conf_server *cserver;

/* conf_value lifecycle. */
conf_value *conf_value_create(int type);
void conf_value_destroy(conf_value *cv);

/* vr_conf lifecycle. */
vr_conf *conf_create(char *filename);
void conf_destroy(vr_conf *cf);

/* Current config version, compared by conf_cache_update() against the
 * cached one. */
unsigned long long conf_version_get(void);

/* Read / write a server option by name (one of CONFIG_SOPN_*). For
 * conf_server_get(), 'value' points to storage of the option's type. */
int conf_server_get(const char *option_name, void *value);
int conf_server_set(const char *option_name, conf_value *value);

/* The functions below share the signature of the conf_option 'set' and
 * 'get' callbacks. */
int conf_set_maxmemory(void *obj, conf_option *opt, void *data);
int conf_set_maxmemory_policy(void *obj, conf_option *opt, void *data);
int conf_set_int_non_zero(void *obj, conf_option *opt, void *data);

int conf_get_sds(void *obj, conf_option *opt, void *data);
int conf_get_int(void *obj, conf_option *opt, void *data);
int conf_get_longlong(void *obj, conf_option *opt, void *data);
int conf_get_array_sds(void *obj, conf_option *opt, void *data);

int conf_set_sds(void *obj, conf_option *opt, void *data);
int conf_set_password(void *obj, conf_option *opt, void *data);
int conf_set_int(void *obj, conf_option *opt, void *data);
int conf_set_longlong(void *obj, conf_option *opt, void *data);
int conf_set_yesorno(void *obj, conf_option *opt, void *data);
int conf_set_array_sds(void *obj, conf_option *opt, void *data);
int conf_set_commands_need_adminpass(void *obj, conf_option *opt, void *data);

/* Configuration lock helpers. NOTE(review): presumably wrappers around
 * vr_conf.rwl; confirm in vr_conf.c. */
int CONF_RLOCK(void);
int CONF_WLOCK(void);
int CONF_UNLOCK(void);

/* Config file lock helpers, held around the config file rewrite. */
int CONFF_LOCK(void);
int CONFF_UNLOCK(void);

/* Printable name of an eviction policy value. */
const char *get_evictpolicy_strings(int evictpolicy_type);

/* CONFIG command entry point. */
void configCommand(struct client *c);

/* conf_cache lifecycle and refresh. */
int conf_cache_init(conf_cache *cc);
int conf_cache_deinit(conf_cache *cc);
int conf_cache_update(conf_cache *cc);

#endif


================================================
FILE: src/vr_connection.c
================================================
#include <sys/uio.h>

#include <vr_core.h>

static void conn_free(struct conn *conn);

/* Obtain a connection object for the connection base 'cb' (may be NULL).
 *
 * A connection is taken from cb's free queue when one is available,
 * otherwise a new one is allocated. In both cases its state is reset and
 * its in/out queues are created if missing. When 'cb' is not NULL its total
 * and current connection counters are incremented.
 *
 * Returns NULL if an allocation fails. */
static struct conn *
_conn_get(conn_base *cb)
{
    struct conn *conn;
    int reuse = (cb != NULL && dlistLength(cb->free_connq) > 0);

    if (reuse) {
        conn = dlistPop(cb->free_connq);
    } else {
        conn = dalloc(sizeof(*conn));
        if (conn == NULL) {
            return NULL;
        }
        conn->cb = cb;

        /* A fresh connection has no queues yet; they are created below. */
        conn->inqueue = NULL;
        conn->outqueue = NULL;
    }

    /* Ownership and socket. */
    conn->owner = NULL;
    conn->sd = -1;

    /* Traffic counters. */
    conn->send_bytes = 0;
    conn->recv_bytes = 0;

    /* Error and readiness flags. */
    conn->err = 0;
    conn->recv_active = 0;
    conn->recv_ready = 0;
    conn->send_active = 0;
    conn->send_ready = 0;

    /* Connection life cycle flags. */
    conn->connecting = 0;
    conn->connected = 0;
    conn->eof = 0;
    conn->done = 0;

    if (conn->inqueue == NULL &&
        (conn->inqueue = dlistCreate()) == NULL) {
        conn_free(conn);
        return NULL;
    }

    if (conn->outqueue == NULL &&
        (conn->outqueue = dlistCreate()) == NULL) {
        conn_free(conn);
        return NULL;
    }

    if (cb != NULL) {
        cb->ntotal_conn++;
        cb->ncurr_conn++;
    }

    return conn;
}

/* Public wrapper around _conn_get(): returns a ready-to-use connection for
 * 'cb' and logs it, or returns NULL when none could be obtained. */
struct conn *
conn_get(conn_base *cb)
{
    struct conn *conn = _conn_get(cb);

    if (conn != NULL) {
        log_debug(LOG_VVERB, "get conn %p client %d", conn, conn->sd);
    }

    return conn;
}

static void
conn_free(struct conn *conn)
{
    log_debug(LOG_VVERB, "free conn %p", conn);

    if (conn == NULL) {
        return;
    }

    if (conn->sd > 0) {
        close(conn->sd);
        conn->sd = -1;
        update_curr_clients_sub(1);
    }

    if (conn->inqueue) {
        sds buf;
        while (buf = dlistPop(conn->inqueue)) {
            sdsfree(buf);
        }
        dlistRelease(conn->inqueue);
        conn->inqueue = NULL;
    }

    if (conn->outqueue) {
        sds buf;
        while (buf = dlistPop(conn->outqueue)) {
            sdsfree(buf);
        }
        dlistRelease(conn->outqueue);
        conn->outqueue = NULL;
    }
    
    dfree(conn);
}

void
conn_put(struct conn *conn)
{
    conn_base *cb = conn->cb;
    
    ASSERT(conn->owner == NULL);

    log_debug(LOG_VVERB, "put conn %p", conn);

    if (conn->sd > 0) {
        close(conn->sd);
        conn->sd = -1;
        update_curr_clients_sub(1);
    }

    if (cb == NULL) {
        conn_free(conn);
        return;
    }

    if (conn->inqueue) {
        sds buf;
        while (buf = dlistPop(conn->inqueue)) {
            sdsfree(buf);
        }
    }

    if (conn->outqueue) {
        sds buf;
        while (buf = dlistPop(conn->outqueue)) {
            sdsfree(buf);
        }
    }

    dlistPush(cb->free_connq, conn);
    cb->ncurr_cconn--;
    cb->ncurr_conn--;
}

/* Initialise a connection base: all three connection counters are zeroed
 * and an empty free-connection queue is created.
 *
 * Returns VR_OK on success, or VR_ENOMEM when the queue cannot be
 * created. */
int
conn_init(conn_base *cb)
{
    /* sizeof yields a size_t, hence %zu. */
    log_debug(LOG_DEBUG, "conn size %zu", sizeof(struct conn));

    cb->free_connq = NULL;
    cb->ntotal_conn = 0;
    cb->ncurr_conn = 0;
    cb->ncurr_cconn = 0;

    cb->free_connq = dlistCreate();
    if (cb->free_connq == NULL) {
        return VR_ENOMEM;
    }

    return VR_OK;
}

/* Tear down a connection base: every connection parked in the free queue
 * is destroyed and the queue itself is released. Nothing is done when the
 * base has no free queue. */
void
conn_deinit(conn_base *cb)
{
    struct conn *conn;

    if (cb->free_connq == NULL) {
        return;
    }

    while ((conn = dlistPop(cb->free_connq)) != NULL) {
        conn_free(conn);
    }
    ASSERT(dlistLength(cb->free_connq) == 0);
    dlistRelease(cb->free_connq);
}

/* Read up to 'size' bytes from the connection socket into 'buf'.
 *
 * Returns the number of bytes read (> 0), 0 on end of file (conn->eof is
 * set), VR_EAGAIN when the socket has no data available right now, or
 * VR_ERROR on any other failure (conn->err holds errno). A read interrupted
 * by a signal is retried. conn->recv_ready is cleared whenever the socket
 * returned less than requested or not at all. */
ssize_t
conn_recv(struct conn *conn, void *buf, size_t size)
{
    ssize_t n;

    ASSERT(buf != NULL);
    ASSERT(size > 0);
    ASSERT(conn->recv_ready);

    for (;;) {
        n = vr_read(conn->sd, buf, size);

        log_debug(LOG_VERB, "recv on sd %d %zd of %zu", conn->sd, n, size);

        if (n > 0) {
            /* A short read means the socket has been drained for now. */
            if (n < (ssize_t) size) {
                conn->recv_ready = 0;
            }
            conn->recv_bytes += (size_t)n;
            return n;
        }

        if (n == 0) {
            conn->recv_ready = 0;
            conn->eof = 1;
            log_debug(LOG_INFO, "recv on sd %d eof rb %zu sb %zu", conn->sd,
                      conn->recv_bytes, conn->send_bytes);
            return n;
        }

        /* n < 0: look at errno. */
        if (errno == EINTR) {
            log_debug(LOG_VERB, "recv on sd %d not ready - eintr", conn->sd);
            continue;
        }

        /* Every remaining case leaves the socket not ready for reading. */
        conn->recv_ready = 0;

        if (errno == EAGAIN || errno == EWOULDBLOCK) {
            log_debug(LOG_VERB, "recv on sd %d not ready - eagain", conn->sd);
            return VR_EAGAIN;
        }

        conn->err = errno;
        log_error("recv on sd %d failed: %s", conn->sd, strerror(errno));
        return VR_ERROR;
    }

    NOT_REACHED();

    return VR_ERROR;
}

/* Write up to 'nsend' bytes from 'buf' to the connection socket.
 *
 * Returns the number of bytes written (> 0), 0 when the write call wrote
 * nothing, VR_EAGAIN when the socket cannot accept data right now, or
 * VR_ERROR on any other failure (conn->err holds errno). A write
 * interrupted by a signal is retried. conn->send_ready is cleared whenever
 * less than 'nsend' bytes were accepted. */
ssize_t
conn_send(struct conn *conn, void *buf, size_t nsend)
{
    ssize_t n;

    ASSERT(nsend != 0);
    ASSERT(conn->send_ready);

    for (;;) {
        n = vr_write(conn->sd, buf, nsend);

        log_debug(LOG_VERB, "send on sd %d %zd of %zu",
                  conn->sd, n, nsend);

        if (n > 0) {
            /* A short write means the socket buffer is full for now. */
            if (n < (ssize_t) nsend) {
                conn->send_ready = 0;
            }
            conn->send_bytes += (size_t)n;
            return n;
        }

        if (n == 0) {
            log_warn("send on sd %d returned zero", conn->sd);
            conn->send_ready = 0;
            return 0;
        }

        /* n < 0: look at errno. */
        if (errno == EINTR) {
            log_debug(LOG_VERB, "send on sd %d not ready - eintr", conn->sd);
            continue;
        }

        /* Every remaining case leaves the socket not ready for writing. */
        conn->send_ready = 0;

        if (errno == EAGAIN || errno == EWOULDBLOCK) {
            log_debug(LOG_VERB, "send on sd %d not ready - eagain", conn->sd);
            return VR_EAGAIN;
        }

        conn->err = errno;
        log_error("send on sd %d failed: %s", conn->sd, strerror(errno));
        return VR_ERROR;
    }

    NOT_REACHED();

    return VR_ERROR;
}

/* Write the buffers described by the 'sendv' array to the connection
 * socket with a single vectored write; 'nsend' is the total number of bytes
 * the caller expects to send.
 *
 * Returns the number of bytes written (> 0), 0 when the write call wrote
 * nothing, VR_EAGAIN when the socket cannot accept data right now, or
 * VR_ERROR on any other failure (conn->err holds errno). A write
 * interrupted by a signal is retried. conn->send_ready is cleared whenever
 * less than 'nsend' bytes were accepted. */
ssize_t
conn_sendv(struct conn *conn, struct darray *sendv, size_t nsend)
{
    ssize_t n;

    ASSERT(darray_n(sendv) > 0);
    ASSERT(nsend != 0);
    ASSERT(conn->send_ready);

    for (;;) {
        n = vr_writev(conn->sd, sendv->elem, sendv->nelem);

        log_debug(LOG_VERB, "sendv on sd %d %zd of %zu in %"PRIu32" buffers",
                  conn->sd, n, nsend, sendv->nelem);

        if (n > 0) {
            /* A short write means the socket buffer is full for now. */
            if (n < (ssize_t) nsend) {
                conn->send_ready = 0;
            }
            conn->send_bytes += (size_t)n;
            return n;
        }

        if (n == 0) {
            log_warn("sendv on sd %d returned zero", conn->sd);
            conn->send_ready = 0;
            return 0;
        }

        /* n < 0: look at errno. */
        if (errno == EINTR) {
            log_debug(LOG_VERB, "sendv on sd %d not ready - eintr", conn->sd);
            continue;
        }

        /* Every remaining case leaves the socket not ready for writing. */
        conn->send_ready = 0;

        if (errno == EAGAIN || errno == EWOULDBLOCK) {
            log_debug(LOG_VERB, "sendv on sd %d not ready - eagain", conn->sd);
            return VR_EAGAIN;
        }

        conn->err = errno;
        log_error("sendv on sd %d failed: %s", conn->sd, strerror(errno));
        return VR_ERROR;
    }

    NOT_REACHED();

    return VR_ERROR;
}


================================================
FILE: src/vr_connection.h
================================================
#ifndef _VR_CONNECTION_H_
#define _VR_CONNECTION_H_

/* Per-owner pool of connection objects: a queue of connections available
 * for reuse plus connection counters. Set up by conn_init() and torn down
 * by conn_deinit(). */
typedef struct conn_base {
    dlist *free_connq;           /* free conn q */
    uint64_t ntotal_conn;       /* total # connections counter from start */
    uint32_t ncurr_conn;        /* current # connections */
    uint32_t ncurr_cconn;       /* current # client connections */
}conn_base;

/* State of a single socket connection: the descriptor, byte counters,
 * the last error, readiness/lifecycle flags and the request/response
 * queues attached to it. */
struct conn {
    void                *owner;          /* connection owner */
    
    conn_base           *cb;             /* connect base */

    int                 sd;              /* socket descriptor */

    size_t              recv_bytes;      /* received (read) bytes */
    size_t              send_bytes;      /* sent (written) bytes */

    err_t               err;             /* connection errno */
    unsigned            recv_active:1;   /* recv active? */
    unsigned            recv_ready:1;    /* recv ready? */
    unsigned            send_active:1;   /* send active? */
    unsigned            send_ready:1;    /* send ready? cleared by the send
                                            routines on short write, EAGAIN
                                            or error */

    unsigned            connecting:1;    /* connecting? */
    unsigned            connected:1;     /* connected? */
    unsigned            eof:1;           /* eof? aka passive close? */
    unsigned            done:1;          /* done? aka close? */

    dlist                *inqueue;        /* incoming request queue */
    dlist                *outqueue;       /* outputing response queue */
};

struct conn *conn_get(conn_base *cb);
void conn_put(struct conn *conn);

int conn_init(conn_base *cb);
void conn_deinit(conn_base *cb);

ssize_t conn_recv(struct conn *conn, void *buf, size_t size);
ssize_t conn_send(struct conn *conn, void *buf, size_t nsend);
ssize_t conn_sendv(struct conn *conn, struct darray *sendv, size_t nsend);

#endif


================================================
FILE: src/vr_core.c
================================================
#include <stdlib.h>
#include <unistd.h>

#include <vr_core.h>

/* NOTE(review): presumably the number of file descriptors kept aside for
 * internal use (compare RESERVED_FDS in vr_core.h); it is not referenced
 * in the visible part of this file -- confirm it is still needed. */
static uint32_t reserved_fds = 0;


================================================
FILE: src/vr_core.h
================================================
#ifndef _VR_CORE_H_
#define _VR_CORE_H_

#ifdef HAVE_CONFIG_H
# include <config.h>
#endif

#include <dspecialconfig.h>

#ifdef HAVE_STATS
# define VR_STATS 1
#else
# define VR_STATS 0
#endif

#ifdef HAVE_LITTLE_ENDIAN
# define VR_LITTLE_ENDIAN 1
#endif

#ifdef HAVE_BACKTRACE
# define VR_HAVE_BACKTRACE 1
#endif

#ifdef HAVE_SPINLOCK
# define VR_USE_SPINLOCK 1
#endif

/* Generic status codes used as function return values. */
#define VR_OK        0   /* success */
#define VR_ERROR    -1   /* generic failure */
#define VR_EAGAIN   -2   /* operation would block, retry later */
#define VR_ENOMEM   -3   /* presumably: out of memory -- confirm usage */

/* reserved fds for std streams, log, stats fd, epoll etc. */
#define RESERVED_FDS 32

typedef int rstatus_t; /* return type */
typedef int err_t;      /* error type */

typedef long long mstime_t; /* millisecond time type. */

struct instance;
struct darray;
struct conn;
struct client;
struct clientBufferLimitsConfig;
struct redisCommand;
struct vr_worker;

#include <stddef.h>
#include <stdint.h>
#include <inttypes.h>
#include <string.h>
#include <stdio.h>
#include <ctype.h>
#include <errno.h>
#include <limits.h>
#include <time.h>
#include <unistd.h>
#include <pthread.h>

#include <sys/types.h>
#include <sys/socket.h>
#include <sys/un.h>
#include <sys/time.h>
#include <sys/resource.h>
#include <netinet/in.h>

#include <ae.h>
#include <sds.h>
#include <dutil.h>
#include <dlog.h>
#include <dhashkit.h>
#include <dmalloc.h>
#include <darray.h>
#include <dlist.h>

#include <vr_util.h>
#include <vr_signal.h>

#include <vr_ziplist.h>
#include <vr_zipmap.h>
#include <vr_dict.h>
#include <vr_rbtree.h>
#include <vr_intset.h>
#include <vr_quicklist.h>

#include <vr_lzf.h>
#include <vr_lzfP.h>

#include <vr_object.h>

#include <vr_listen.h>
#include <vr_connection.h>

#include <vr_stats.h>
#include <vr_conf.h>

#include <vr_thread.h>
#include <vr_eventloop.h>
#include <vr_master.h>
#include <vr_worker.h>
#include <vr_backend.h>

#include <vr_db.h>
#include <vr_multi.h>

#include <vr_command.h>
#include <vr_block.h>
#include <vr_client.h>
#include <vr_server.h>

#include <vr_notify.h>
#include <vr_pubsub.h>

#include <vr_rdb.h>
#include <vr_aof.h>
#include <vr_replication.h>
#include <vr_scripting.h>

#include <vr_t_hash.h>
#include <vr_t_list.h>
#include <vr_t_set.h>
#include <vr_t_string.h>
#include <vr_t_zset.h>

#include <vr_bitops.h>

#include <vr_hyperloglog.h>

#include <vr_slowlog.h>

/* Process-wide settings of one running server instance: logging,
 * configuration file, host identity, pid file handling and the number
 * of threads. */
struct instance {
    int             log_level;                   /* log level */
    char            *log_filename;               /* log filename */
    char            *conf_filename;              /* configuration filename */
    char            hostname[VR_MAXHOSTNAMELEN]; /* hostname */
    size_t          mbuf_chunk_size;             /* mbuf chunk size */
    pid_t           pid;                         /* process id */
    char            *pid_filename;               /* pid filename */
    unsigned        pidfile:1;                   /* pid file created? */
    int             thread_num;                  /* the thread number */
};

#endif


================================================
FILE: src/vr_db.c
================================================
#include <signal.h>
#include <ctype.h>

#include <vr_core.h>

/* Db->dict, keys are sds strings, vals are Redis objects.
 * The dictionary owns both: key and value destructors are installed, and
 * no dup callbacks are used (dbAdd() stores its own sds copy of the key). */
dictType dbDictType = {
    dictSdsHash,                /* hash function */
    NULL,                       /* key dup */
    NULL,                       /* val dup */
    dictSdsKeyCompare,          /* key compare */
    dictSdsDestructor,          /* key destructor */
    dictObjectDestructor   /* val destructor */
};

/* Db->expires.
 * No destructors are installed: the key sds is shared with the main
 * dictionary (see dbDelete()), so this table must never free it. */
dictType keyptrDictType = {
    dictSdsHash,               /* hash function */
    NULL,                      /* key dup */
    NULL,                      /* val dup */
    dictSdsKeyCompare,         /* key compare */
    NULL,                      /* key destructor */
    NULL                       /* val destructor */
};

/* Keylist hash table type: unencoded redis objects as keys and lists as
 * values. It is used for blocking operations (BLPOP) and to map swapped
 * keys to the list of clients waiting for those keys to be loaded.
 * In this file it backs both db->blocking_keys and db->watched_keys. */
dictType keylistDictType = {
    dictObjHash,                /* hash function */
    NULL,                       /* key dup */
    NULL,                       /* val dup */
    dictObjKeyCompare,          /* key compare */
    dictObjectDestructor,       /* key destructor */
    dictListDestructor          /* val destructor */
};

/* Allocate an eviction pool of MAXMEMORY_EVICTION_POOL_SIZE entries and
 * reset every slot (idle time 0, no key). Returns the new array. */
static struct evictionPoolEntry *evictionPoolAlloc(void) {
    struct evictionPoolEntry *pool;
    int slot = 0;

    pool = dalloc(sizeof(*pool)*MAXMEMORY_EVICTION_POOL_SIZE);
    while (slot < MAXMEMORY_EVICTION_POOL_SIZE) {
        pool[slot].idle = 0;
        pool[slot].key = NULL;
        slot++;
    }
    return pool;
}

/*-----------------------------------------------------------------------------
 * C-level DB API
 *----------------------------------------------------------------------------*/

/* Initialize an already allocated redisDb: create its dictionaries
 * (keyspace, expires, blocking/ready/watched keys), allocate the eviction
 * pool, reset the average TTL and set up the per-database rwlock.
 *
 * Always returns VR_OK; the results of dictCreate() and
 * pthread_rwlock_init() are not checked here. */
int redisDbInit(redisDb *db)
{
    db->dict = dictCreate(&dbDictType,NULL);
    db->expires = dictCreate(&keyptrDictType,NULL);
    db->blocking_keys = dictCreate(&keylistDictType,NULL);
    db->ready_keys = dictCreate(&setDictType,NULL);
    db->watched_keys = dictCreate(&keylistDictType,NULL);
    db->eviction_pool = evictionPoolAlloc();
    db->avg_ttl = 0;

    pthread_rwlock_init(&db->rwl, NULL);

    return VR_OK;
}

/* Tear down a redisDb. Only the rwlock is destroyed here; the
 * dictionaries and eviction pool created by redisDbInit() are not
 * released by this function.
 * NOTE(review): confirm they are freed elsewhere. Always returns VR_OK. */
int 
redisDbDeinit(redisDb *db)
{
    pthread_rwlock_destroy(&db->rwl);
    return VR_OK;
}

/* Acquire the database rwlock for reading. The pthread return code is
 * ignored and VR_OK is always returned. */
int
lockDbRead(redisDb *db)
{
    pthread_rwlock_rdlock(&db->rwl);
    return VR_OK;
}

/* Acquire the database rwlock for writing. The pthread return code is
 * ignored and VR_OK is always returned. */
int
lockDbWrite(redisDb *db)
{
    pthread_rwlock_wrlock(&db->rwl);
    return VR_OK;
}

/* Release the database rwlock taken by lockDbRead() or lockDbWrite().
 * The pthread return code is ignored and VR_OK is always returned. */
int
unlockDb(redisDb *db)
{
    pthread_rwlock_unlock(&db->rwl);
    return VR_OK;
}

/* Low level lookup of 'key' in the main dictionary of 'db'.
 * Returns the stored value, or NULL when the key is not present.
 * No expiration check is performed here. */
robj *lookupKey(redisDb *db, robj *key) {
    dictEntry *entry = dictFind(db->dict,key->ptr);
    robj *found;

    if (entry == NULL) {
        return NULL;
    }

    found = dictGetVal(entry);

    /* Touch the access time only when no saving child exists, to avoid
     * triggering copy-on-write. The real LRU clock is currently disabled
     * and the field is simply reset to zero. */
    if (server.rdb_child_pid == -1 && server.aof_child_pid == -1) {
        found->lru = 0;
    }

    return found;
}

/* Lookup for read operations: a key reported as expired by
 * checkIfExpired() is treated as missing (NULL); otherwise the result
 * of lookupKey() is returned. */
robj *lookupKeyRead(redisDb *db, robj *key) {
    return checkIfExpired(db, key) ? NULL : lookupKey(db,key);
}

/* Lookup for write operations. When 'expired' is not NULL the key is
 * first passed to expireIfNeeded() and the result is stored in *expired;
 * when 'expired' is NULL no expiration is attempted at all. */
robj *lookupKeyWrite(redisDb *db, robj *key, int *expired) {
    if (expired != NULL) {
        *expired = expireIfNeeded(db,key);
    }

    return lookupKey(db,key);
}

/* Read lookup on the client's current db; when the key is missing,
 * 'reply' is sent to the client. Returns the value or NULL. */
robj *lookupKeyReadOrReply(client *c, robj *key, robj *reply) {
    robj *found = lookupKeyRead(c->db, key);

    if (found == NULL) {
        addReply(c,reply);
    }
    return found;
}

/* Write lookup on the client's current db; when the key is missing,
 * 'reply' is sent to the client. 'expired' is forwarded unchanged to
 * lookupKeyWrite(). Returns the value or NULL. */
robj *lookupKeyWriteOrReply(client *c, robj *key, robj *reply, int *expired) {
    robj *found = lookupKeyWrite(c->db, key, expired);

    if (found == NULL) {
        addReply(c,reply);
    }
    return found;
}

/* Insert 'key' -> 'val' into the main dictionary of 'db'.
 *
 * The dictionary stores its own sds copy of the key name. The caller is
 * responsible for the reference count of 'val', which must be an
 * independent object. The program is aborted if the key already exists.
 * Adding a list value also signals the key as ready. */
void dbAdd(redisDb *db, robj *key, robj *val) {
    sds keycopy = sdsdup(key->ptr);
    int retval;

    retval = dictAdd(db->dict, keycopy, val);
    serverAssertWithInfo(NULL,key,retval == DICT_OK);

    if (val->type == OBJ_LIST) {
        signalListAsReady(db, key);
    }
}

/* Overwrite an existing key with a new value. Incrementing the reference
 * count of the new value is up to the caller.
 * This function does not modify the expire time of the existing key
 * (db->expires is not touched here).
 *
 * The program is aborted if the key was not already present. 
 * Val object must be independent. */
void dbOverwrite(redisDb *db, robj *key, robj *val) {
    dictEntry *de = dictFind(db->dict,key->ptr);

    /* The key must already exist: this is a replace, never an insert. */
    serverAssertWithInfo(NULL,key,de != NULL);
    dictReplace(db->dict, key->ptr, val);
}

/* High level set operation: store 'val' under 'key' whether or not the
 * key already exists.
 *
 * 1) 'val' must be an independent object.
 * 2) 'expired' is forwarded to lookupKeyWrite() (may be NULL).
 * 3) Any expire on the key is removed (the key is made persistent).
 *
 * This function does not itself notify clients WATCHing the key; there
 * is no signalModifiedKey() call here. */
void setKey(redisDb *db, robj *key, robj *val, int *expired) {
    robj *existing = lookupKeyWrite(db,key,expired);

    if (existing != NULL) {
        dbOverwrite(db,key,val);
    } else {
        dbAdd(db,key,val);
    }

    removeExpire(db,key);
}

/* Return non-zero if 'key' is present in the main dictionary of 'db',
 * zero otherwise. No expiration check is made here. */
int dbExists(redisDb *db, robj *key) {
    return dictFind(db->dict,key->ptr) != NULL;
}

/* Pick a random, not yet expired key from 'db' and return it as a newly
 * created string object (owned by the caller), or NULL when the
 * dictionary yields no entry.
 *
 * The db read lock is taken for each attempt and released before
 * returning or retrying. Expired keys are skipped by sampling again. */
robj *dbRandomKey(redisDb *db) {
    for (;;) {
        dictEntry *entry;
        sds name;
        robj *candidate;

        lockDbRead(db);
        entry = dictGetRandomKey(db->dict);
        if (entry == NULL) {
            unlockDb(db);
            return NULL;
        }

        name = dictGetKey(entry);
        candidate = createStringObject(name,sdslen(name));

        /* Accept the key unless it has an expire set and is expired. */
        if (dictFind(db->expires,name) == NULL ||
            !checkIfExpired(db,candidate)) {
            unlockDb(db);
            return candidate;
        }

        /* This one expired: drop it and search for another key. */
        unlockDb(db);
        freeObject(candidate);
    }
}

/* Remove 'key', its value and its expire entry (if any) from 'db'.
 * Returns 1 when the key was found in the main dictionary and deleted,
 * 0 otherwise. */
int dbDelete(redisDb *db, robj *key) {
    /* The expires dict shares the key sds with the main dict, so
     * dropping the expire entry first does not free the key name. */
    if (dictSize(db->expires) > 0) {
        dictDelete(db->expires,key->ptr);
    }

    return (dictDelete(db->dict,key->ptr) == DICT_OK) ? 1 : 0;
}

/* Make sure the string value 'o' stored at 'key' can be modified in
 * place. A non-constant, RAW encoded object is returned as is. Otherwise
 * a fresh raw string object with the decoded content is created, stored
 * in the db in place of the old value, and returned. */
robj *dbUnshareStringValue(redisDb *db, robj *key, robj *o) {
    robj *decoded, *unshared;

    ASSERT(o->type == OBJ_STRING);

    if (!o->constant && o->encoding == OBJ_ENCODING_RAW) {
        return o;
    }

    decoded = getDecodedObject(o);
    unshared = createRawStringObject(decoded->ptr, sdslen(decoded->ptr));
    if (decoded != o) {
        freeObject(decoded);
    }
    dbOverwrite(db,key,unshared);

    return unshared;
}

/* Empty the keyspace and expires dictionaries of every database in
 * server.dbs, passing 'callback' through to dictEmpty(). Returns the
 * total number of keys that were held by the main dictionaries.
 * No database lock is taken here. */
long long emptyDb(void(callback)(void*)) {
    long long total = 0;
    int idx = 0;

    while (idx < server.dbnum) {
        redisDb *db = darray_get(&server.dbs, (uint32_t)idx);

        total += dictSize(db->dict);
        dictEmpty(db->dict,callback);
        dictEmpty(db->expires,callback);
        idx++;
    }

    return total;
}

/* Select logical database 'id' for client 'c'.
 *
 * Returns VR_ERROR when 'id' is outside [0, server.dblnum), otherwise
 * records the id in c->dictid and returns VR_OK. Only c->dictid is
 * updated here; c->db is left untouched. */
int selectDb(client *c, int id) {
    if (id < 0 || id >= server.dblnum)
        return VR_ERROR;

    c->dictid = id;
    return VR_OK;
}

/*-----------------------------------------------------------------------------
 * Hooks for key space changes.
 *
 * Every time a key in the database is modified the function
 * signalModifiedKey() is called.
 *
 * Every time a DB is flushed the function signalFlushDb() is called.
 *----------------------------------------------------------------------------*/

/* Hook invoked when 'key' in 'db' is modified: forwards to
 * touchWatchedKey(). */
void signalModifiedKey(redisDb *db, robj *key) {
    touchWatchedKey(db,key);
}

/* Hook invoked when the database with id 'dbid' is flushed: forwards to
 * touchWatchedKeysOnFlush(). */
void signalFlushedDb(int dbid) {
    touchWatchedKeysOnFlush(dbid);
}

/*-----------------------------------------------------------------------------
 * Type agnostic commands operating on the key space
 *----------------------------------------------------------------------------*/

/* FLUSHDB: visit each of the server.dbinum internal databases reachable
 * through fetchInternalDbById() and, under the write lock, account the
 * removed keys as dirty, signal the flush and empty both the keyspace
 * and the expires dictionaries. Replies +OK. */
void flushdbCommand(client *c) {
    int dbi = 0;

    while (dbi < server.dbinum) {
        fetchInternalDbById(c, dbi);

        lockDbWrite(c->db);
        c->vel->dirty += dictSize(c->db->dict);
        signalFlushedDb(c->db->id);
        dictEmpty(c->db->dict,NULL);
        dictEmpty(c->db->expires,NULL);
        unlockDb(c->db);

        dbi++;
    }

    addReply(c,shared.ok);
}

/* FLUSHALL: empty the keyspace and expires dictionaries of every
 * database in server.dbs, each under its own write lock. Replies +OK.
 * Unlike flushdbCommand(), no dirty counter or flush signal is updated
 * here. */
void flushallCommand(client *c) {
    int dbi = 0;

    while (dbi < server.dbnum) {
        redisDb *target = darray_get(&server.dbs, (uint32_t)dbi);

        lockDbWrite(target);
        dictEmpty(target->dict,NULL);
        dictEmpty(target->expires,NULL);
        unlockDb(target);

        dbi++;
    }

    addReply(c,shared.ok);
}

/* DEL key [key ...]: delete each named key from the internal database
 * it maps to, under that database's write lock. Replies with the number
 * of keys actually deleted. Keys found expired along the way are added
 * to the 'expiredkeys' statistic. */
void delCommand(client *c) {
    int removed = 0;
    int expired = 0;
    int argi;

    for (argi = 1; argi < c->argc; argi++) {
        robj *key = c->argv[argi];

        fetchInternalDbByKey(c, key);
        lockDbWrite(c->db);

        expired += expireIfNeeded(c->db,key);
        if (dbDelete(c->db,key)) {
            signalModifiedKey(c->db,key);
            notifyKeyspaceEvent(NOTIFY_GENERIC,"del",key,c->db->id);
            c->vel->dirty++;
            removed++;
        }

        unlockDb(c->db);
    }

    addReplyLongLong(c,removed);

    if (expired > 0) {
        update_stats_add(c->vel->stats, expiredkeys, expired);
    }
}

/* EXISTS key1 key2 ... key_N.
 * Replies with the number of given keys that exist and are not expired.
 * Each key is checked under the read lock of the internal database it
 * maps to. Hits and misses are recorded in the keyspace statistics. */
void existsCommand(client *c) {
    long long present = 0;
    int argi;

    for (argi = 1; argi < c->argc; argi++) {
        robj *key = c->argv[argi];

        fetchInternalDbByKey(c,key);
        lockDbRead(c->db);
        if (!checkIfExpired(c->db,key) && dbExists(c->db,key)) {
            present++;
        }
        unlockDb(c->db);
    }

    addReplyLongLong(c,present);

    update_stats_add(c->vel->stats, keyspace_hits, present);
    update_stats_add(c->vel->stats, keyspace_misses, c->argc-1-present);
}

/* SELECT index: switch the client to the given logical database.
 *
 * Replies with an "invalid DB index" error when the argument is not an
 * integer, does not fit in an int, or is rejected by selectDb();
 * otherwise replies +OK. */
void selectCommand(client *c) {
    long id;

    if (getLongFromObjectOrReply(c, c->argv[1], &id,
        "invalid DB index") != VR_OK)
        return;

    /* selectDb() takes an int: reject values that would be silently
     * truncated (and could wrap around to a valid index) when 'long' is
     * wider than 'int'. */
    if (id < INT_MIN || id > INT_MAX || selectDb(c,(int)id) == VR_ERROR) {
        addReplyError(c,"invalid DB index");
    } else {
        addReply(c,shared.ok);
    }
}

/* RANDOMKEY: reply with a random key, or a null bulk when none is found.
 *
 * The search starts from a randomly chosen internal database and moves
 * on to the following ones (wrapping around) each time dbRandomKey()
 * returns NULL, giving up after server.dbinum retries. */
void randomkeyCommand(client *c) {
    robj *key;
    int retries = 0;
    int idx = random()%server.dbinum;

    for (;;) {
        fetchInternalDbById(c, idx);
        key = dbRandomKey(c->db);
        if (key != NULL) {
            break;
        }

        if (retries++ >= server.dbinum) {
            addReply(c,shared.nullbulk);
            return;
        }

        /* Try the next internal database, wrapping at the end. */
        if (++idx >= server.dbinum) {
            idx = 0;
        }
    }

    addReplyBulk(c,key);
    freeObject(key);
}

/* KEYS pattern: reply with every non-expired key matching 'pattern'
 * across all internal databases.
 *
 * Before scanning, the total number of keys is compared with the
 * configured max-time-complexity-limit; when the limit is set and
 * exceeded, the command is refused with shared.outofcomplexitylimit.
 *
 * Keys found expired during the scan are expired on the spot (the write
 * lock is held) and accounted in the 'expiredkeys' statistic, in the
 * same way delCommand() does. */
void keysCommand(client *c) {
    dictIterator *di;
    dictEntry *de;
    sds pattern = c->argv[1]->ptr;
    int plen = sdslen(pattern), allkeys;
    unsigned long numkeys = 0;
    void *replylen;
    int idx;
    long long keys_count = 0;
    unsigned long expired = 0;
    long long max_time_complexity_limit;

    /* Check if it is reach the max-time-complexity-limit */
    for (idx = 0; idx < server.dbinum; idx ++) {
        fetchInternalDbById(c, idx);
        lockDbWrite(c->db);
        keys_count += dictSize(c->db->dict);
        unlockDb(c->db);
    }

    max_time_complexity_limit = c->vel->cc.max_time_complexity_limit;
    if (max_time_complexity_limit && 
        keys_count > max_time_complexity_limit) {
        addReply(c,shared.outofcomplexitylimit);
        return;
    }

    /* The pattern "*" matches everything: skip the matcher entirely. */
    allkeys = (pattern[0] == '*' && pattern[1] == '\0');

    replylen = addDeferredMultiBulkLength(c);
    for (idx = 0; idx < server.dbinum; idx ++) {
        fetchInternalDbById(c,idx);
        lockDbWrite(c->db);
        /* A safe iterator is used because expireIfNeeded() may delete
         * the entry being visited. */
        di = dictGetSafeIterator(c->db->dict);
        while((de = dictNext(di)) != NULL) {
            sds key = dictGetKey(de);
            robj *keyobj;

            if (allkeys || stringmatchlen(pattern,plen,key,sdslen(key),0)) {
                keyobj = createStringObject(key,sdslen(key));
                if (expireIfNeeded(c->db,keyobj) == 0) {
                    addReplyBulk(c,keyobj);
                    numkeys++;
                } else {
                    expired ++;
                }
                freeObject(keyobj);
            }
        }
        dictReleaseIterator(di);
        unlockDb(c->db);
    }
    setDeferredMultiBulkLength(c,replylen,numkeys);

    /* Report the keys expired during the scan; previously this counter
     * was collected but never used. */
    if (expired > 0) {
        update_stats_add(c->vel->stats, expiredkeys, expired);
    }
}

/* dictScan() callback used by scanGenericCommand().
 *
 * 'privdata' is a two element array: [0] is the list that collects the
 * results, [1] is the object being scanned (NULL when scanning the
 * keyspace). For every visited entry a new string object holding the
 * key/member is appended to the list; for hashes and sorted sets a
 * second object holding the value/score is appended right after it. */
void scanCallback(void *privdata, const dictEntry *de) {
    void **args = (void**) privdata;
    dlist *out = args[0];
    robj *container = args[1];
    robj *key, *val = NULL;

    if (container == NULL) {
        /* Keyspace scan: dictionary keys are plain sds strings. */
        sds name = dictGetKey(de);
        key = createStringObject(name, sdslen(name));
    } else {
        switch (container->type) {
        case OBJ_SET:
            key = dupStringObjectUnconstant(dictGetKey(de));
            break;
        case OBJ_HASH:
            key = dupStringObjectUnconstant(dictGetKey(de));
            val = dupStringObjectUnconstant(dictGetVal(de));
            break;
        case OBJ_ZSET:
            key = dupStringObjectUnconstant(dictGetKey(de));
            val = createStringObjectFromLongDouble(*(double*)dictGetVal(de),0);
            break;
        default:
            serverPanic("Type not handled in SCAN callback.");
        }
    }

    dlistAddNodeTail(out, key);
    if (val != NULL) {
        dlistAddNodeTail(out, val);
    }
}

/* Try to parse a SCAN cursor stored at object 'o':
 * if the cursor is valid, store it as unsigned integer into *cursor and
 * return VR_OK. Otherwise return VR_ERROR and send an error to the
 * client.
 *
 * A cursor is rejected when it starts with whitespace, has trailing
 * characters after the number, or is out of range for unsigned long. */
int parseScanCursorOrReply(client *c, robj *o, unsigned long *cursor) {
    char *eptr;

    /* Use strtoul() because we need an *unsigned* long, so
     * getLongLongFromObject() does not cover the whole cursor space. */
    errno = 0;
    *cursor = strtoul(o->ptr, &eptr, 10);
    /* The cast to unsigned char is required: passing a negative plain
     * char to isspace() is undefined behavior. */
    if (isspace((unsigned char)((char*)o->ptr)[0]) || eptr[0] != '\0' ||
        errno == ERANGE)
    {
        addReplyError(c, "invalid cursor");
        return VR_ERROR;
    }
    return VR_OK;
}

/* This command implements the SCAN, SSCAN, HSCAN and ZSCAN commands.
 * 'scantype' selects the variant: SCAN_TYPE_KEY iterates the key space,
 * while SCAN_TYPE_SET / SCAN_TYPE_HASH / SCAN_TYPE_ZSET iterate the
 * object stored at the key given as first argument.
 *
 * For the object variants the first argument in the client arguments
 * vector is the key, so it is skipped before parsing the cursor and the
 * options (COUNT, MATCH).
 *
 * In the case of a Hash or Sorted Set object the function returns both
 * the field and the value (or member and score) of every element.
 *
 * For SCAN_TYPE_KEY the iteration walks the internal databases one after
 * the other, remembering the current one in c->scanid; when the cursor
 * of one database reaches zero the scan continues with the next one.
 *
 * The temporary 'keys' list is released on every exit path, including
 * the error paths (invalid cursor, missing key, wrong type). */
void scanGenericCommand(client *c, int scantype) {
    int i, j;
    dlist *keys = dlistCreate();
    dlistNode *node, *nextnode;
    long count = 10;
    sds pat = NULL;
    int patlen = 0, use_pattern = 0;
    unsigned long cursor;
    robj *o = NULL;
    dict *ht;

    /* Set i to the first option argument. The previous one is the cursor. */
    i = (scantype == SCAN_TYPE_KEY) ? 2 : 3; /* Skip the key argument if needed. */
    if (parseScanCursorOrReply(c,c->argv[i-1],&cursor) == VR_ERROR)
        goto cleanup;

    /* Step 1: Parse options. */
    while (i < c->argc) {
        j = c->argc - i;
        if (!strcasecmp(c->argv[i]->ptr, "count") && j >= 2) {
            if (getLongFromObjectOrReply(c, c->argv[i+1], &count, NULL)
                != VR_OK)
            {
                goto cleanup;
            }

            if (count < 1) {
                addReply(c,shared.syntaxerr);
                goto cleanup;
            }

            i += 2;
        } else if (!strcasecmp(c->argv[i]->ptr, "match") && j >= 2) {
            pat = c->argv[i+1]->ptr;
            patlen = sdslen(pat);

            /* The pattern always matches if it is exactly "*", so it is
             * equivalent to disabling it. */
            use_pattern = !(pat[0] == '*' && patlen == 1);

            i += 2;
        } else {
            addReply(c,shared.syntaxerr);
            goto cleanup;
        }
    }

    if (scantype == SCAN_TYPE_KEY) {
        o = NULL;
        if (c->scanid == -1 || cursor == 0) c->scanid = 0;
        fetchInternalDbById(c, c->scanid);
        lockDbRead(c->db);
    } else if (scantype == SCAN_TYPE_HASH || 
        scantype == SCAN_TYPE_SET ||
        scantype == SCAN_TYPE_ZSET) {
        fetchInternalDbByKey(c, c->argv[1]);
        lockDbRead(c->db);
        if ((o = lookupKeyReadOrReply(c,c->argv[1],shared.emptyscan)) == NULL) {
            unlockDb(c->db);
            update_stats_add(c->vel->stats, keyspace_misses, 1);
            goto cleanup;
        }
    }

    switch (scantype) {
    case SCAN_TYPE_KEY:
        ASSERT(o == NULL);
        break;
    case SCAN_TYPE_HASH:
        if (checkType(c,o,OBJ_HASH)) {
            unlockDb(c->db);
            update_stats_add(c->vel->stats, keyspace_hits, 1);
            goto cleanup;
        }
        break;
    case SCAN_TYPE_SET:
        if (checkType(c,o,OBJ_SET)) {
            unlockDb(c->db);
            update_stats_add(c->vel->stats, keyspace_hits, 1);
            goto cleanup;
        }
        break;
    case SCAN_TYPE_ZSET:
        if (checkType(c,o,OBJ_ZSET)) {
            unlockDb(c->db);
            update_stats_add(c->vel->stats, keyspace_hits, 1);
            goto cleanup;
        }
        break;
    }

    /* Object must be NULL (to iterate keys names), or the type of the object
     * must be Set, Sorted Set, or Hash. */
    ASSERT(o == NULL || o->type == OBJ_SET || o->type == OBJ_HASH ||
                o->type == OBJ_ZSET);

scan_retry:
    
    /* Step 2: Iterate the collection.
     *
     * Note that if the object is encoded with a ziplist, intset, or any other
     * representation that is not a hash table, we are sure that it is also
     * composed of a small number of elements. So to avoid taking state we
     * just return everything inside the object in a single call, setting the
     * cursor to zero to signal the end of the iteration. */

    /* Handle the case of a hash table. */
    ht = NULL;
    if (scantype == SCAN_TYPE_KEY) {
        ht = c->db->dict;
    } else if (o->type == OBJ_SET && o->encoding == OBJ_ENCODING_HT) {
        ht = o->ptr;
    } else if (o->type == OBJ_HASH && o->encoding == OBJ_ENCODING_HT) {
        ht = o->ptr;
        count *= 2; /* We return key / value for this type. */
    } else if (o->type == OBJ_ZSET && o->encoding == OBJ_ENCODING_SKIPLIST) {
        zset *zs = o->ptr;
        ht = zs->dict;
        count *= 2; /* We return key / value for this type. */
    }

    if (ht) {
        void *privdata[2];
        /* We set the max number of iterations to ten times the specified
         * COUNT, so if the hash table is in a pathological state (very
         * sparsely populated) we avoid to block too much time at the cost
         * of returning no or very few elements. */
        long maxiterations = count*10;

        /* We pass two pointers to the callback: the list to which it will
         * add new elements, and the object containing the dictionary so that
         * it is possible to fetch more data in a type-dependent way. */
        privdata[0] = keys;
        privdata[1] = o;
        do {
            cursor = dictScan(ht, cursor, scanCallback, privdata);
        } while (cursor &&
              maxiterations-- &&
              dlistLength(keys) < (unsigned long)count);
    } else if (o->type == OBJ_SET) {
        int pos = 0;
        int64_t ll;

        while(intsetGet(o->ptr,pos++,&ll))
            dlistAddNodeTail(keys,createStringObjectFromLongLong(ll));
        cursor = 0;
    } else if (o->type == OBJ_HASH || o->type == OBJ_ZSET) {
        unsigned char *p = ziplistIndex(o->ptr,0);
        unsigned char *vstr;
        unsigned int vlen;
        long long vll;

        while(p) {
            ziplistGet(p,&vstr,&vlen,&vll);
            dlistAddNodeTail(keys,
                (vstr != NULL) ? createStringObject((char*)vstr,vlen) :
                                 createStringObjectFromLongLong(vll));
            p = ziplistNext(o->ptr,p);
        }
        cursor = 0;
    } else {
        serverPanic("Not handled encoding in SCAN.");
    }

    unlockDb(c->db);
    if (scantype == SCAN_TYPE_KEY) {
        if (cursor == 0) {
            /* This internal db is exhausted: continue with the next one,
             * or mark the whole scan as finished. */
            if (c->scanid < (server.dbinum - 1)) {
                c->scanid ++;
                fetchInternalDbById(c, c->scanid);
                lockDbRead(c->db);
                goto scan_retry;
            } else {
                c->scanid = -1;
            }
        }
    } else if (scantype == SCAN_TYPE_HASH || 
        scantype == SCAN_TYPE_SET ||
        scantype == SCAN_TYPE_ZSET) {
        update_stats_add(c->vel->stats, keyspace_hits, 1);
    }

    /* Step 3: Filter elements.
     * NOTE(review): the expiration check below runs after the db lock has
     * been released and always against the last fetched c->db -- confirm
     * this is intended. */
    node = dlistFirst(keys);
    while (node) {
        robj *kobj = dlistNodeValue(node);
        nextnode = dlistNextNode(node);
        int filter = 0;

        /* Filter element if it does not match the pattern. */
        if (!filter && use_pattern) {
            if (sdsEncodedObject(kobj)) {
                if (!stringmatchlen(pat, patlen, kobj->ptr, sdslen(kobj->ptr), 0))
                    filter = 1;
            } else {
                char buf[LONG_STR_SIZE];
                int len;

                ASSERT(kobj->encoding == OBJ_ENCODING_INT);
                len = ll2string(buf,sizeof(buf),(long)kobj->ptr);
                if (!stringmatchlen(pat, patlen, buf, len, 0)) filter = 1;
            }
        }

        /* Filter element if it is an expired key. */
        if (!filter && o == NULL && checkIfExpired(c->db,kobj)) filter = 1;

        /* Remove the element and its associted value if needed. */
        if (filter) {
            freeObject(kobj);
            dlistDelNode(keys, node);
        }

        /* If this is a hash or a sorted set, we have a flat list of
         * key-value elements, so if this element was filtered, remove the
         * value, or skip it if it was not filtered: we only match keys. */
        if (o && (o->type == OBJ_ZSET || o->type == OBJ_HASH)) {
            node = nextnode;
            nextnode = dlistNextNode(node);
            if (filter) {
                kobj = dlistNodeValue(node);
                freeObject(kobj);
                dlistDelNode(keys, node);
            }
        }
        node = nextnode;
    }

    /* Step 4: Reply to the client. */
    addReplyMultiBulkLen(c, 2);
    addReplyBulkLongLong(c,cursor);

    addReplyMultiBulkLen(c, dlistLength(keys));
    while ((node = dlistFirst(keys)) != NULL) {
        robj *kobj = dlistNodeValue(node);
        addReplyBulk(c, kobj);
        freeObject(kobj);
        dlistDelNode(keys, node);
    }

cleanup:
    /* Free whatever is still in the list (nothing on the success path),
     * then the list itself. */
    dlistSetFreeMethod(keys,freeObjectVoid);
    dlistRelease(keys);
}

/* The SCAN command completely relies on scanGenericCommand(), invoked
 * in key space mode (SCAN_TYPE_KEY). */
void scanCommand(client *c) {
    scanGenericCommand(c,SCAN_TYPE_KEY);
}

/* DBSIZE: reply with the number of keys summed over all the internal
 * databases, each one read under its read lock. */
void dbsizeCommand(client *c) {
    unsigned long total = 0;
    int dbi = 0;

    while (dbi < server.dbinum) {
        fetchInternalDbById(c, dbi);

        lockDbRead(c->db);
        total += dictSize(c->db->dict);
        unlockDb(c->db);

        dbi++;
    }

    addReplyLongLong(c,total);
}

/* LASTSAVE: reply with the value of server.lastsave as an integer. */
void lastsaveCommand(client *c) {
    addReplyLongLong(c,server.lastsave);
}

/* TYPE key: reply with the type name of the value stored at key
 * ("string", "list", "set", "zset", "hash" or "unknown"), or "none"
 * when the key does not exist. The lookup happens under the read lock
 * of the internal database the key maps to; a keyspace hit or miss is
 * recorded after replying. */
void typeCommand(client *c) {
    robj *o;
    char *type = "none";
    int found = 0;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    o = lookupKeyRead(c->db,c->argv[1]);
    if (o != NULL) {
        found = 1;
        switch(o->type) {
        case OBJ_STRING:
            type = "string";
            break;
        case OBJ_LIST:
            type = "list";
            break;
        case OBJ_SET:
            type = "set";
            break;
        case OBJ_ZSET:
            type = "zset";
            break;
        case OBJ_HASH:
            type = "hash";
            break;
        default:
            type = "unknown";
            break;
        }
    }

    unlockDb(c->db);
    addReplyStatus(c,type);

    if (found) {
        update_stats_add(c->vel->stats, keyspace_hits, 1);
    } else {
        update_stats_add(c->vel->stats, keyspace_misses, 1);
    }
}

/* SHUTDOWN [NOSAVE|SAVE]: validate the optional argument and compute
 * the shutdown flags.
 *
 * The call that would actually perform the shutdown
 * (prepareForShutdown) is currently disabled, so after a successful
 * argument check the command always replies with an error. */
void shutdownCommand(client *c) {
    int flags = 0;

    if (c->argc > 2) {
        addReply(c,shared.syntaxerr);
        return;
    }

    if (c->argc == 2) {
        const char *opt = c->argv[1]->ptr;

        if (strcasecmp(opt,"nosave") == 0) {
            flags |= SHUTDOWN_NOSAVE;
        } else if (strcasecmp(opt,"save") == 0) {
            flags |= SHUTDOWN_SAVE;
        } else {
            addReply(c,shared.syntaxerr);
            return;
        }
    }

    /* While a dataset is being loaded no save must be attempted on
     * shutdown, otherwise the current DB could be overwritten with
     * half-read data: force NOSAVE and drop SAVE. */
    if (server.loading) {
        flags &= ~SHUTDOWN_SAVE;
        flags |= SHUTDOWN_NOSAVE;
    }

    addReplyError(c,"Errors trying to SHUTDOWN. Check logs.");
}

/* Shared implementation of RENAME (nx == 0) and RENAMENX (nx != 0).
 *
 * Moves the value stored at argv[1] to argv[2], carrying over the expire
 * time. With 'nx' set the rename is refused (reply 0) when the
 * destination already exists; otherwise an existing destination is
 * deleted first. Replies with an error when the source does not exist.
 *
 * NOTE(review): unlike the other commands in this file, this function
 * works on c->db without calling fetchInternalDbByKey() or taking the
 * db lock, and updates server.dirty rather than c->vel->dirty -- confirm
 * whether it still needs to be adapted. */
void renameGenericCommand(client *c, int nx) {
    robj *o;
    long long expire;
    int samekey = 0;

    /* When source and dest key is the same, no operation is performed,
     * if the key exists, however we still return an error on unexisting key. */
    if (sdscmp(c->argv[1]->ptr,c->argv[2]->ptr) == 0) samekey = 1;

    if ((o = lookupKeyWriteOrReply(c,c->argv[1],shared.nokeyerr,NULL)) == NULL)
        return;

    if (samekey) {
        addReply(c,nx ? shared.czero : shared.ok);
        return;
    }

    /* Take a reference so the value survives the deletion of the source
     * key further down. */
    incrRefCount(o);
    expire = getExpire(c->db,c->argv[1]);
    if (lookupKeyWrite(c->db,c->argv[2],NULL) != NULL) {
        if (nx) {
            decrRefCount(o);
            addReply(c,shared.czero);
            return;
        }
        /* Overwrite: delete the old key before creating the new one
         * with the same name. */
        dbDelete(c->db,c->argv[2]);
    }
    dbAdd(c->db,c->argv[2],o);
    if (expire != -1) setExpire(c->db,c->argv[2],expire);
    dbDelete(c->db,c->argv[1]);
    signalModifiedKey(c->db,c->argv[1]);
    signalModifiedKey(c->db,c->argv[2]);
    notifyKeyspaceEvent(NOTIFY_GENERIC,"rename_from",
        c->argv[1],c->db->id);
    notifyKeyspaceEvent(NOTIFY_GENERIC,"rename_to",
        c->argv[2],c->db->id);
    server.dirty++;
    addReply(c,nx ? shared.cone : shared.ok);
}

/* RENAME: renameGenericCommand() with nx == 0 (an existing destination
 * is overwritten). */
void renameCommand(client *c) {
    renameGenericCommand(c,0);
}

/* RENAMENX: renameGenericCommand() with nx == 1 (the rename is refused
 * when the destination exists). */
void renamenxCommand(client *c) {
    renameGenericCommand(c,1);
}

/* MOVE key db.
 *
 * Moves c->argv[1] from the client's current DB to the DB whose index is
 * given in c->argv[2]. Replies shared.cone on success, shared.czero when the
 * key is missing in the source or already present in the target,
 * shared.outofrangeerr for an unusable index and shared.sameobjecterr when
 * source and target are the same DB. */
void moveCommand(client *c) {
    robj *key = c->argv[1];
    robj *val;
    redisDb *from, *to;
    int from_id, index_ok;
    long long target, ttl;

    /* Remember where we are so we can switch back after resolving the
     * target DB through selectDb(). */
    from = c->db;
    from_id = c->db->id;

    /* The index must parse, fit in an int, and be selectable. The checks
     * short-circuit, so selectDb() only runs on a validated value. */
    index_ok = getLongLongFromObject(c->argv[2],&target) != VR_ERROR &&
               target >= INT_MIN && target <= INT_MAX &&
               selectDb(c,target) != VR_ERROR;
    if (!index_ok) {
        addReply(c,shared.outofrangeerr);
        return;
    }
    to = c->db;
    selectDb(c,from_id); /* Back to the source DB */

    /* Moving a key onto its own DB is most likely a user mistake. */
    if (from == to) {
        addReply(c,shared.sameobjecterr);
        return;
    }

    /* The key must exist in the source DB... */
    val = lookupKeyWrite(c->db,key,NULL);
    if (val == NULL) {
        addReply(c,shared.czero);
        return;
    }
    ttl = getExpire(c->db,key);

    /* ...and must not exist in the target DB. */
    if (lookupKeyWrite(to,key,NULL) != NULL) {
        addReply(c,shared.czero);
        return;
    }

    /* Add to the target (with its expire, if any) and take a reference
     * for the new owner. */
    dbAdd(to,key,val);
    if (ttl != -1) setExpire(to,key,ttl);
    incrRefCount(val);

    /* OK! key moved, free the entry in the source DB */
    dbDelete(from,key);
    server.dirty++;
    addReply(c,shared.cone);
}

/*-----------------------------------------------------------------------------
 * Expires API
 *----------------------------------------------------------------------------*/

/* Drop the expire associated with 'key' in 'db'.
 *
 * Returns 1 when an entry was deleted from db->expires, 0 otherwise. */
int removeExpire(redisDb *db, robj *key) {
    int rc;

    /* An expire may only be removed if there is a corresponding entry in the
     * main dict. Otherwise, the key will never be freed. */
    serverAssertWithInfo(NULL,key,dictFind(db->dict,key->ptr) != NULL);

    rc = dictDelete(db->expires,key->ptr);
    return rc == DICT_OK;
}

/* Set (or replace) the expire of 'key' in 'db' to 'when'.
 *
 * The key must already exist in the main dict (asserted). */
void setExpire(redisDb *db, robj *key, long long when) {
    dictEntry *kde;
    dictEntry *expire_entry;

    kde = dictFind(db->dict,key->ptr);
    serverAssertWithInfo(NULL,key,kde != NULL);

    /* The expires dict is keyed by the very same sds stored in the main
     * dict, so the key string is reused rather than duplicated. */
    expire_entry = dictReplaceRaw(db->expires,dictGetKey(kde));
    dictSetSignedIntegerVal(expire_entry,when);
}

/* Look up the expire time stored for 'key' in 'db'.
 *
 * Returns the value stored in db->expires, or -1 when the key has no
 * expire (i.e. the key is non volatile). */
long long getExpire(redisDb *db, robj *key) {
    dictEntry *de;

    /* Fast path: nothing in this DB has an expire at all. */
    if (dictSize(db->expires) == 0) return -1;

    de = dictFind(db->expires,key->ptr);
    if (de == NULL) return -1;

    /* Safety check: a key found in the expires dict must also be present
     * in the main dict. */
    serverAssertWithInfo(NULL,key,dictFind(db->dict,key->ptr) != NULL);
    return dictGetSignedIntegerVal(de);
}

/* Propagate the expiration of 'key' to the AOF file and to the slaves as a
 * synthesized "DEL key" command.
 *
 * Centralizing expiry like this, together with the ordering guarantees of
 * both the AOF and the master->slave link, keeps everything consistent even
 * when writes are allowed against keys that are about to expire. */
void propagateExpire(redisDb *db, robj *key) {
    robj *argv[2];
    int i;

    argv[0] = shared.del;
    argv[1] = key;

    /* Keep both objects referenced while they are being fed around. */
    for (i = 0; i < 2; i++) incrRefCount(argv[i]);

    if (server.aof_state != AOF_OFF)
        feedAppendOnlyFile(server.delCommand,db->id,argv,2);
    replicationFeedSlaves(repl.slaves,db->id,argv,2);

    for (i = 0; i < 2; i++) decrRefCount(argv[i]);
}

/* Report whether 'key' has an expire in 'db' that already lies in the past.
 *
 * Returns 1 when the stored expire is positive and earlier than the current
 * time in milliseconds, 0 otherwise. Nothing is deleted. */
int checkIfExpired(redisDb *db, robj *key) {
    long long deadline = getExpire(db,key);

    return (deadline > 0 && vr_msec_now() > deadline) ? 1 : 0;
}

/* Delete 'key' from 'db' if its expire time has passed.
 *
 * Returns 0 when the key has no expire, while the server is loading, or when
 * the key is still valid. On a slave nothing is deleted and the return value
 * only tells whether the key looks expired. Otherwise an "expired" keyspace
 * event is emitted and the result of dbDelete() is returned.
 *
 * NOTE: the propagateExpire() call is currently disabled in this function. */
int expireIfNeeded(redisDb *db, robj *key) {
    long long deadline = getExpire(db,key);
    long long now;

    /* No expire for this key */
    if (deadline < 0) return 0;

    /* Don't expire anything while loading. It will be done later. */
    if (server.loading) return 0;

    /* Inside a Lua script time is frozen at the moment the script started,
     * so a key can only expire the first time it is accessed and never in
     * the middle of the script. This keeps propagation to slaves / AOF
     * consistent. See issue #1525 on Github for more information. */
    if (server.lua_caller)
        now = server.lua_time_start;
    else
        now = vr_msec_now();

    /* On a slave the master drives expiration by sending synthesized DEL
     * operations, so just report what we think: 1 if the key looks
     * expired right now, 0 if it should still be valid. */
    if (repl.masterhost != NULL) return now > deadline;

    /* Still valid. */
    if (now <= deadline) return 0;

    /* Delete the key */
    //propagateExpire(db,key);
    notifyKeyspaceEvent(NOTIFY_EXPIRED,"expired",key,db->id);
    return dbDelete(db,key);
}

/*-----------------------------------------------------------------------------
 * Expires Commands
 *----------------------------------------------------------------------------*/

/* This is the generic command implementation for EXPIRE, PEXPIRE, EXPIREAT
 * and PEXPIREAT. Because the command's second argument may be relative or
 * absolute the "basetime" argument is used to signal what the base time is
 * (either 0 for *AT variants of the command, or the current time for
 * relative expires).
 *
 * unit is either UNIT_SECONDS or UNIT_MILLISECONDS, and is only used for
 * the argv[2] parameter. The basetime is always specified in milliseconds.
 *
 * Replies:
 *   - an error (and nothing is changed) when argv[2] is not an integer or
 *     when converting it to an absolute millisecond time would overflow;
 *   - shared.czero when the key does not exist;
 *   - shared.cone when the expire was set, or when the key was deleted
 *     because the requested time is already in the past. */
void expireGenericCommand(client *c, long long basetime, int unit) {
    robj *key = c->argv[1], *param = c->argv[2];
    long long when; /* unix time in milliseconds when the key will expire. */
    int expired = 0;

    if (getLongLongFromObjectOrReply(c, param, &when, NULL) != VR_OK)
        return;

    /* Negative values are legal (they mean "already expired"), but the
     * value comes straight from the client: make sure neither the unit
     * conversion nor the basetime addition can overflow a long long, which
     * would be undefined behavior. */
    if (unit == UNIT_SECONDS) {
        if (when > LLONG_MAX/1000 || when < LLONG_MIN/1000) {
            addReplyError(c,"invalid expire time");
            return;
        }
        when *= 1000;
    }
    if ((basetime > 0 && when > LLONG_MAX - basetime) ||
        (basetime < 0 && when < LLONG_MIN - basetime))
    {
        addReplyError(c,"invalid expire time");
        return;
    }
    when += basetime;

    fetchInternalDbByKey(c, key);
    lockDbWrite(c->db);
    /* No key, return zero. */
    if (lookupKeyWrite(c->db,key,&expired) == NULL) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        addReply(c,shared.czero);
        return;
    }

    /* EXPIRE with negative TTL, or EXPIREAT with a timestamp into the past
     * should never be executed as a DEL when load the AOF or in the context
     * of a slave instance.
     *
     * Instead we take the other branch of the IF statement setting an expire
     * (possibly in the past) and wait for an explicit DEL from the master. */
    if (when <= vr_msec_now() && !server.loading && !repl.masterhost) {
        robj *aux;

        serverAssertWithInfo(c,key,dbDelete(c->db,key));
        c->vel->dirty++;

        /* Replicate/AOF this as an explicit DEL. */
        aux = dupStringObjectUnconstant(key);
        rewriteClientCommandVector(c,2,shared.del,aux);
        signalModifiedKey(c->db,key);
        notifyKeyspaceEvent(NOTIFY_GENERIC,"del",key,c->db->id);
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        addReply(c, shared.cone);
        return;
    } else {
        setExpire(c->db,key,when);
        addReply(c,shared.cone);
        signalModifiedKey(c->db,key);
        notifyKeyspaceEvent(NOTIFY_GENERIC,"expire",key,c->db->id);
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        c->vel->dirty++;
        return;
    }
}

/* EXPIRE key seconds: relative expire, argument in seconds. */
void expireCommand(client *c) {
    long long now_ms = vr_msec_now();

    expireGenericCommand(c,now_ms,UNIT_SECONDS);
}

/* EXPIREAT key timestamp: absolute expire, argument in seconds. */
void expireatCommand(client *c) {
    const long long basetime = 0;

    expireGenericCommand(c,basetime,UNIT_SECONDS);
}

/* PEXPIRE key milliseconds: relative expire, argument in milliseconds. */
void pexpireCommand(client *c) {
    long long now_ms = vr_msec_now();

    expireGenericCommand(c,now_ms,UNIT_MILLISECONDS);
}

/* PEXPIREAT key ms-timestamp: absolute expire, argument in milliseconds. */
void pexpireatCommand(client *c) {
    const long long basetime = 0;

    expireGenericCommand(c,basetime,UNIT_MILLISECONDS);
}

/* Shared implementation of TTL and PTTL.
 *
 * Replies -2 when c->argv[1] does not exist, -1 when it exists without an
 * expire, otherwise the remaining time to live (never negative): in
 * milliseconds when 'output_ms' is non-zero, else rounded to the nearest
 * second. Keyspace hit/miss statistics are updated accordingly. */
void ttlGenericCommand(client *c, int output_ms) {
    robj *key = c->argv[1];
    long long deadline, remaining;

    fetchInternalDbByKey(c, key);
    lockDbRead(c->db);

    /* If the key does not exist at all, return -2 */
    if (lookupKeyRead(c->db,key) == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        addReplyLongLong(c,-2);
        return;
    }

    /* The key exists: read its expire while still holding the lock. */
    deadline = getExpire(c->db,key);
    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);

    /* No expire associated with the key. */
    if (deadline == -1) {
        addReplyLongLong(c,-1);
        return;
    }

    /* An expire in the past is reported as a TTL of zero. */
    remaining = deadline-vr_msec_now();
    if (remaining < 0) remaining = 0;

    if (!output_ms) remaining = (remaining+500)/1000;
    addReplyLongLong(c,remaining);
}

/* TTL key: remaining time to live, reported in seconds. */
void ttlCommand(client *c) {
    const int output_ms = 0;

    ttlGenericCommand(c, output_ms);
}

/* PTTL key: remaining time to live, reported in milliseconds. */
void pttlCommand(client *c) {
    const int output_ms = 1;

    ttlGenericCommand(c, output_ms);
}

/* PERSIST key.
 *
 * Replies shared.cone (and bumps the dirty counter) when an expire was
 * removed from c->argv[1]; replies shared.czero when the key does not exist
 * or had no expire. The whole check runs under the DB write lock. */
void persistCommand(client *c) {
    robj *key = c->argv[1];

    fetchInternalDbByKey(c, key);
    lockDbWrite(c->db);

    /* removeExpire() asserts the key exists in the main dict, so only call
     * it after the dictFind() succeeded. */
    if (dictFind(c->db->dict,key->ptr) != NULL && removeExpire(c->db,key)) {
        addReply(c,shared.cone);
        c->vel->dirty++;
    } else {
        addReply(c,shared.czero);
    }

    unlockDb(c->db);
}

/* -----------------------------------------------------------------------------
 * API to get key arguments from commands
 * ---------------------------------------------------------------------------*/

/* Base case of key extraction: derive the key positions from the command
 * table fields (firstkey, lastkey, keystep).
 *
 * Returns a dalloc()ed array of argv indexes and stores its length in
 * *numkeys. When cmd->firstkey is 0, NULL is returned and *numkeys is 0.
 * A negative cmd->lastkey is taken relative to 'argc'. */
int *getKeysUsingCommandTable(struct redisCommand *cmd,robj **argv, int argc, int *numkeys) {
    int j, count, last, *keys;
    UNUSED(argv);

    if (cmd->firstkey == 0) {
        *numkeys = 0;
        return NULL;
    }

    last = (cmd->lastkey < 0) ? argc+cmd->lastkey : cmd->lastkey;

    /* Sized for the worst case of a key step of one. */
    keys = dalloc(sizeof(int)*((last - cmd->firstkey)+1));

    count = 0;
    j = cmd->firstkey;
    while (j <= last) {
        ASSERT(j < argc);
        keys[count] = j;
        count++;
        j += cmd->keystep;
    }

    *numkeys = count;
    return keys;
}

/* Return the positions of all the key arguments of the command passed via
 * argc / argv.
 *
 * The result is a heap allocated array of integers (argv indexes) whose
 * length is stored by reference into *numkeys.
 *
 * 'cmd' must point to the redisCommand table entry matching the command
 * name in argv[0].
 *
 * Commands that provide a getkeys_proc helper are handled by that helper;
 * all the others are resolved through the command table. */
int *getKeysFromCommand(struct redisCommand *cmd, robj **argv, int argc, int *numkeys) {
    if (!cmd->getkeys_proc)
        return getKeysUsingCommandTable(cmd,argv,argc,numkeys);

    return cmd->getkeys_proc(cmd,argv,argc,numkeys);
}

/* Release an array previously returned by getKeysFromCommand(); the
 * pointer is handed to dfree() as is. */
void getKeysFreeResult(int *result) {
    dfree(result);
}

/* Helper function to extract keys from following commands:
 * ZUNIONSTORE <destkey> <num-keys> <key> <key> ... <key> <options>
 * ZINTERSTORE <destkey> <num-keys> <key> <key> ... <key> <options>
 *
 * Returns a dalloc()ed array holding the positions of the <num-keys> input
 * keys followed by the position of <destkey>, and stores its length in
 * *numkeys. When <num-keys> is smaller than 1 or larger than the number of
 * arguments that follow it, no key is reported: NULL is returned and
 * *numkeys is set to 0. */
int *zunionInterGetKeys(struct redisCommand *cmd, robj **argv, int argc, int *numkeys) {
    int i, num, *keys;
    UNUSED(cmd);

    num = atoi(argv[2]->ptr);
    /* Sanity check. Don't return any key if the command is going to
     * reply with syntax error. A value below 1 must be rejected here as
     * well: a negative count would otherwise be used both as an
     * allocation size and as an array index below. */
    if (num < 1 || num > (argc-3)) {
        *numkeys = 0;
        return NULL;
    }

    /* Keys in z{union,inter}store come from two places:
     * argv[1] = storage key,
     * argv[3...n] = keys to intersect */
    keys = dalloc(sizeof(int)*(num+1));

    /* Add all key positions for argv[3...n] to keys[] */
    for (i = 0; i < num; i++) keys[i] = 3+i;

    /* Finally add the argv[1] key position (the storage key target). */
    keys[num] = 1;
    *numkeys = num+1;  /* Total keys = {union,inter} keys + storage key */
    return keys;
}

/* Helper function to extract keys from the following commands:
 * EVAL <script> <num-keys> <key> <key> ... <key> [more stuff]
 * EVALSHA <script> <num-keys> <key> <key> ... <key> [more stuff]
 *
 * Returns a dalloc()ed array with the positions of the <num-keys> keys and
 * stores its length in *numkeys. When <num-keys> is zero, negative, or
 * larger than the number of arguments that follow it, there is nothing to
 * report: NULL is returned and *numkeys is set to 0. */
int *evalGetKeys(struct redisCommand *cmd, robj **argv, int argc, int *numkeys) {
    int i, num, *keys;
    UNUSED(cmd);

    num = atoi(argv[2]->ptr);
    /* Sanity check. Don't return any key if the command is going to
     * reply with syntax error. Non-positive counts are rejected too: a
     * negative value would turn into a huge allocation size below. */
    if (num <= 0 || num > (argc-3)) {
        *numkeys = 0;
        return NULL;
    }

    keys = dalloc(sizeof(int)*num);
    *numkeys = num;

    /* Add all key positions for argv[3...n] to keys[] */
    for (i = 0; i < num; i++) keys[i] = 3+i;

    return keys;
}

/* Key extraction helper for the SORT command.
 *
 * SORT <sort-key> ... STORE <store-key> ...
 *
 * argv[1] is always a key. The remaining arguments are SQL-like options;
 * only the minimum needed to locate the key given to the "STORE" option is
 * parsed here. The returned dalloc()ed array has one or two entries and its
 * length is stored in *numkeys. */
int *sortGetKeys(struct redisCommand *cmd, robj **argv, int argc, int *numkeys) {
    int pos, k, *keys, have_store = 0;
    UNUSED(cmd);

    keys = dalloc(sizeof(int)*2); /* Alloc 2 places for the worst case. */
    keys[0] = 1; /* <sort-key> is always present. */

    /* Options are assumed to take no argument unless listed here: for the
     * listed ones the given number of following arguments is skipped, so
     * that an option value is not mistaken for an option name. */
    struct {
        char *name;
        int skip;
    } skiplist[] = {
        {"limit", 2},
        {"get", 1},
        {"by", 1},
        {NULL, 0} /* End of elements. */
    };

    for (pos = 2; pos < argc; pos++) {
        if (!strcasecmp(argv[pos]->ptr,"store") && pos+1 < argc) {
            /* Slot 1 is simply overwritten on every match, so the *last*
             * "STORE" option wins when several are provided. This is the
             * same behavior as SORT. */
            have_store = 1;
            keys[1] = pos+1; /* <store-key> */
            continue;
        }
        for (k = 0; skiplist[k].name != NULL; k++) {
            if (!strcasecmp(argv[pos]->ptr,skiplist[k].name)) {
                pos += skiplist[k].skip;
                break;
            }
        }
    }

    *numkeys = 1 + have_store;
    return keys;
}

/* Key extraction helper for MIGRATE.
 *
 * In the plain form the only key is argv[3]. In the extended form, a "KEYS"
 * option found at position 6 or later while argv[3] is the empty string
 * means that every argument following "KEYS" is a key. Returns a dalloc()ed
 * array of positions and stores its length in *numkeys. */
int *migrateGetKeys(struct redisCommand *cmd, robj **argv, int argc, int *numkeys) {
    int i, *keys;
    int first = 3; /* Assume the obvious form. */
    int num = 1;
    UNUSED(cmd);

    /* But check for the extended one with the KEYS option. */
    for (i = 6; i < argc; i++) {
        if (strcasecmp(argv[i]->ptr,"keys") != 0) continue;
        if (sdslen(argv[3]->ptr) != 0) continue;

        first = i+1;
        num = argc-first;
        break;
    }

    keys = dalloc(sizeof(int)*num);
    i = 0;
    while (i < num) {
        keys[i] = first+i;
        i++;
    }
    *numkeys = num;
    return keys;
}

/* Point c->db at the internal DB that owns 'key'.
 *
 * The index into server.dbs is the low 14 bits of the CRC16 of the key,
 * reduced modulo server.dbinum, offset by c->dictid*server.dbinum.
 * Always returns VR_OK. */
int fetchInternalDbByKey(client *c, robj *key) {
    c->db = darray_get(&server.dbs,
        (hash_crc16(key->ptr,stringObjectLen(key))&0x3FFF)%server.dbinum
        + c->dictid*server.dbinum);

    return VR_OK;
}

/* Point c->db at the internal DB number 'idx' within the group selected by
 * c->dictid, i.e. element idx + c->dictid*server.dbinum of server.dbs.
 * Always returns VR_OK. */
int fetchInternalDbById(client *c, int idx) {
    c->db = darray_get(&server.dbs,
        idx + c->dictid*server.dbinum);

    return VR_OK;
}

/* Shrink the hash tables of the DB at index 'dbid' of server.dbs when
 * htNeedsResize() says so (i.e. when the percentage of used slots drops to
 * HASHTABLE_MIN_FILL), in order to save memory. Both the keyspace dict and
 * the expires dict are checked, under the DB write lock. */
void tryResizeHashTablesForDb(int dbid) {
    redisDb *db = darray_get(&server.dbs, dbid);

    lockDbWrite(db);

    if (htNeedsResize(db->dict)) {
        dictResize(db->dict);
    }
    if (htNeedsResize(db->expires)) {
        dictResize(db->expires);
    }

    unlockDb(db);
}

/* Our hash table implementation performs rehashing incrementally while
 * we write/read from the hash table. Still if the server is idle, the hash
 * table will use two tables for a long time. So we try to use 1 millisecond
 * of CPU time at every call of this function to perform some rehashing.
 *
 * Only one dict is advanced per call: the keyspace dict if it is rehashing,
 * otherwise the expires dict. The work is done under the DB write lock.
 *
 * The function returns 1 if some rehashing was performed, otherwise 0
 * is returned. */
int incrementallyRehashForDb(int dbid) {
    redisDb *db = darray_get(&server.dbs, dbid);
    int worked = 0;

    lockDbWrite(db);

    if (dictIsRehashing(db->dict)) {
        /* Keys dictionary */
        dictRehashMilliseconds(db->dict,1);
        worked = 1; /* already used our millisecond for this loop... */
    } else if (dictIsRehashing(db->expires)) {
        /* Expires */
        dictRehashMilliseconds(db->expires,1);
        worked = 1; /* already used our millisecond for this loop... */
    }

    unlockDb(db);
    return worked;
}

/* Try to expire a few timed out keys. The algorithm used is adaptive and
 * will use few CPU cycles if there are few expiring keys, otherwise
 * it will get more aggressive to avoid that too much memory is used by
 * keys that can be removed from the keyspace.
 *
 * No more than CRON_DBS_PER_CALL databases are tested at every
 * iteration, unless the previous run stopped because of the time limit
 * (backend->timelimit_exit), in which case all of them are scanned.
 *
 * Expire cycle type:
 *
 * If type is ACTIVE_EXPIRE_CYCLE_FAST the function will try to run a
 * "fast" expire cycle that takes no longer than
 * ACTIVE_EXPIRE_CYCLE_FAST_DURATION microseconds, and is not repeated
 * again before twice that amount of time has passed. A fast cycle is only
 * started when the previous cycle set backend->timelimit_exit.
 *
 * If type is ACTIVE_EXPIRE_CYCLE_SLOW, that normal expire cycle is
 * executed, where the time limit is a percentage of the server.hz period
 * as specified by the ACTIVE_EXPIRE_CYCLE_SLOW_TIME_PERC define.
 *
 * 'backend' carries the state kept across calls (current_db,
 * timelimit_exit, last_fast_cycle) and the stats object that receives the
 * number of keys expired by this call. Each database is processed while
 * holding its write lock. */

void activeExpireCycle(vr_backend *backend, int type) {
    int j, iteration = 0;
    int dbs_per_call = CRON_DBS_PER_CALL;
    long long start = vr_usec_now(), timelimit;
    long long expired_total = 0;

    if (type == ACTIVE_EXPIRE_CYCLE_FAST) {
        /* Don't start a fast cycle if the previous cycle did not exit
         * because of the time limit. Also don't repeat a fast cycle for the
         * same period as the fast cycle total duration itself. */
        if (!backend->timelimit_exit) return;
        if (start < backend->last_fast_cycle + ACTIVE_EXPIRE_CYCLE_FAST_DURATION*2) return;
        backend->last_fast_cycle = start;
    }

    /* We usually should test CRON_DBS_PER_CALL per iteration, with
     * two exceptions:
     *
     * 1) Don't test more DBs than we have.
     * 2) If last time we hit the time limit, we want to scan all DBs
     * in this iteration, as there is work to do in some DB and we don't want
     * expired keys to use memory for too much time.
     *
     * NOTE(review): databases are counted and indexed here using
     * server.dbnum, while fetchInternalDbByKey()/fetchInternalDbById()
     * index server.dbs using server.dbinum -- confirm that server.dbnum
     * covers every element of server.dbs. */
    if (dbs_per_call > server.dbnum || backend->timelimit_exit)
        dbs_per_call = server.dbnum;

    /* We can use at max ACTIVE_EXPIRE_CYCLE_SLOW_TIME_PERC percentage of CPU time
     * per iteration. Since this function gets called with a frequency of
     * server.hz times per second, the following is the max amount of
     * microseconds we can spend in this function. */
    timelimit = 1000000*ACTIVE_EXPIRE_CYCLE_SLOW_TIME_PERC/server.hz/100;
    backend->timelimit_exit = 0;
    if (timelimit <= 0) timelimit = 1;

    if (type == ACTIVE_EXPIRE_CYCLE_FAST)
        timelimit = ACTIVE_EXPIRE_CYCLE_FAST_DURATION; /* in microseconds. */

    for (j = 0; j < dbs_per_call; j++) {
        int expired;
        redisDb *db = darray_get(&server.dbs, backend->current_db%server.dbnum);

        /* Increment the DB now so we are sure if we run out of time
         * in the current DB we'll restart from the next. This allows to
         * distribute the time evenly across DBs. */
        backend->current_db++;
        
        lockDbWrite(db);
        /* Continue to expire if at the end of the cycle more than 25%
         * of the keys were expired. */
        do {
            unsigned long num, slots;
            long long now, ttl_sum;
            int ttl_samples;
            /* If there is nothing to expire try next DB ASAP. */
            if ((num = dictSize(db->expires)) == 0) {
                db->avg_ttl = 0;
                break;
            }
            slots = dictSlots(db->expires);
            now = vr_msec_now();

            /* When there are less than 1% filled slots getting random
             * keys is expensive, so stop here waiting for better times...
             * The dictionary will be resized asap. */
            if (num && slots > DICT_HT_INITIAL_SIZE &&
                (num*100/slots < 1)) break;

            /* The main collection cycle. Sample random keys among keys
             * with an expire set, checking for expired ones. */
            expired = 0;
            ttl_sum = 0;
            ttl_samples = 0;

            /* Cap the number of keys sampled in a single pass. */
            if (num > ACTIVE_EXPIRE_CYCLE_LOOKUPS_PER_LOOP)
                num = ACTIVE_EXPIRE_CYCLE_LOOKUPS_PER_LOOP;

            while (num--) {
                dictEntry *de;
                long long ttl;

                if ((de = dictGetRandomKey(db->expires)) == NULL) break;
                /* Read the TTL before the entry is possibly deleted by
                 * activeExpireCycleTryExpire(). */
                ttl = dictGetSignedIntegerVal(de)-now;
                if (activeExpireCycleTryExpire(db,de,now)) expired++;
                if (ttl > 0) {
                    /* We want the average TTL of keys yet not expired. */
                    ttl_sum += ttl;
                    ttl_samples++;
                }
            }

            expired_total += expired;

            /* Update the average TTL stats for this database. */
            if (ttl_samples) {
                long long avg_ttl = ttl_sum/ttl_samples;

                /* Do a simple running average with a few samples.
                 * We just use the current estimate with a weight of 2%
                 * and the previous estimate with a weight of 98%. */
                if (db->avg_ttl == 0) db->avg_ttl = avg_ttl;
                db->avg_ttl = (db->avg_ttl/50)*49 + (avg_ttl/50);
            }

            /* We can't block forever here even if there are many keys to
             * expire. So after a given amount of microseconds return to the
             * caller waiting for the other active expire cycle. */
            iteration++;
            if ((iteration & 0xf) == 0) { /* check once every 16 iterations. */
                long long elapsed = vr_usec_now()-start;

                //latencyAddSampleIfNeeded("expire-cycle",elapsed/1000);
                if (elapsed > timelimit) backend->timelimit_exit = 1;
            }
            if (backend->timelimit_exit) {
                /* Out of time: release the lock, account for what was
                 * expired so far and leave. */
                unlockDb(db);

                if (expired_total > 0) {
                    update_stats_add(backend->vel.stats, expiredkeys, expired_total);
                }
                return;
            }
            /* We don't repeat the cycle if there are less than 25% of keys
             * found expired in the current DB. */
        } while (expired > ACTIVE_EXPIRE_CYCLE_LOOKUPS_PER_LOOP/4);
        unlockDb(db);
    }

    /* Account for the keys expired by this call. */
    if (expired_total > 0) {
        update_stats_add(backend->vel.stats, expiredkeys, expired_total);
    }
}

/* Helper of activeExpireCycle(): 'de' is an entry of db->expires.
 *
 * If the expire time stored in 'de' is earlier than 'now' the key is
 * deleted from 'db' and 1 is returned, otherwise nothing is done and 0 is
 * returned. The caller is expected to hold the DB lock. */
int activeExpireCycleTryExpire(redisDb *db, dictEntry *de, long long now) {
    long long t = dictGetSignedIntegerVal(de);
    sds key;
    robj *keyobj;

    /* Not expired yet. */
    if (now <= t) return 0;

    /* dbDelete() wants an object, so wrap the key in a temporary one. */
    key = dictGetKey(de);
    keyobj = createStringObject(key,sdslen(key));
    dbDelete(db,keyobj);
    freeObject(keyobj);
    return 1;
}

/* Periodic 'background' work on the databases that has to be done
 * incrementally: active key expiring, hash table resizing and rehashing.
 * 'backend' holds the cursors (resize_db, rehash_db) that remember where
 * the previous call stopped. */
void databasesCron(vr_backend *backend) {
    int budget, j;

    /* Expire keys by random sampling. Not required for slaves
     * as master will synthesize DELs for us. */
    if (repl.masterhost == NULL)
        activeExpireCycle(backend, ACTIVE_EXPIRE_CYCLE_SLOW);

    /* Resize/rehash only when no child process is saving the DB on disk:
     * otherwise moving memory around causes a lot of copy-on-write of
     * memory pages. */
    if (server.rdb_child_pid != -1 || server.aof_child_pid != -1) return;

    /* Don't test more DBs than we have. */
    budget = CRON_DBS_PER_CALL;
    if (budget > server.dbnum) budget = server.dbnum;

    /* Resize */
    for (j = 0; j < budget; j++) {
        tryResizeHashTablesForDb(backend->resize_db%server.dbnum);
        backend->resize_db++;
    }

    /* Rehash */
    if (!server.activerehashing) return;

    for (j = 0; j < budget; j++) {
        int work_done = incrementallyRehashForDb(backend->rehash_db%server.dbnum);

        backend->rehash_db++;
        /* If the function did some work, stop here, we'll do
         * more at the next cron loop. */
        if (work_done) break;
    }
}


================================================
FILE: src/vr_db.h
================================================
#ifndef _VR_DB_H_
#define _VR_DB_H_

/* To improve the quality of the LRU approximation we take a set of keys
 * that are good candidates for eviction across freeMemoryIfNeeded() calls.
 *
 * Entries inside the eviction pool are taken ordered by idle time, putting
 * greater idle times to the right (ascending order).
 *
 * Empty entries have the key pointer set to NULL. */
#define MAXMEMORY_EVICTION_POOL_SIZE 16
struct evictionPoolEntry {
    unsigned long long idle;    /* Object idle time. */
    sds key;                    /* Key name. */
};

/* Vire database representation. There are multiple databases identified
 * by integers from 0 (the default database) up to the max configured
 * database. The database number is the 'id' field in the structure.
 *
 * Every database carries its own read/write lock; see lockDbRead(),
 * lockDbWrite() and unlockDb() declared below. */
typedef struct redisDb {
    dict *dict;                 /* The keyspace for this DB */
    dict *expires;              /* Timeout of keys with a timeout set */
    dict *blocking_keys;        /* Keys with clients waiting for data (BLPOP) */
    dict *ready_keys;           /* Blocked keys that received a PUSH */
    dict *watched_keys;         /* WATCHED keys for MULTI/EXEC CAS */
    struct evictionPoolEntry *eviction_pool;    /* Eviction pool of keys */
    int id;                     /* Database ID */
    long long avg_ttl;          /* Average TTL, just for stats; maintained
                                 * by activeExpireCycle() */

    pthread_rwlock_t rwl;       /* read write lock (presumably the one taken
                                 * by lockDbRead()/lockDbWrite() -- confirm) */
} redisDb;

/* Dict types declared here and defined elsewhere. */
extern dictType dbDictType;
extern dictType keyptrDictType;
extern dictType keylistDictType;

/* redisDb setup and teardown. */
int redisDbInit(redisDb *db);
int redisDbDeinit(redisDb *db);

/* Per-database locking. */
int lockDbRead(redisDb *db);
int lockDbWrite(redisDb *db);
int unlockDb(redisDb *db);

/* Keyspace access and generic key commands. */
robj *lookupKey(redisDb *db, robj *key);
robj *lookupKeyRead(redisDb *db, robj *key);
robj *lookupKeyWrite(redisDb *db, robj *key, int *expired);
robj *lookupKeyReadOrReply(struct client *c, robj *key, robj *reply);
robj *lookupKeyWriteOrReply(struct client *c, robj *key, robj *reply, int *expired);
void dbAdd(redisDb *db, robj *key, robj *val);
void dbOverwrite(redisDb *db, robj *key, robj *val);
void setKey(redisDb *db, robj *key, robj *val, int *expired);
int dbExists(redisDb *db, robj *key);
robj *dbRandomKey(redisDb *db);
int dbDelete(redisDb *db, robj *key);
robj *dbUnshareStringValue(redisDb *db, robj *key, robj *o);
long long emptyDb(void(callback)(void*));
int selectDb(struct client *c, int id);
void signalModifiedKey(redisDb *db, robj *key);
void signalFlushedDb(int dbid);
void flushdbCommand(struct client *c);
void flushallCommand(struct client *c);
void delCommand(struct client *c);
void existsCommand(struct client *c);
void selectCommand(struct client *c);
void randomkeyCommand(struct client *c);
void keysCommand(struct client *c);
void scanCallback(void *privdata, const dictEntry *de);
int parseScanCursorOrReply(struct client *c, robj *o, unsigned long *cursor);
void scanGenericCommand(struct client *c, int scantype);
void scanCommand(struct client *c);
void dbsizeCommand(struct client *c);
void lastsaveCommand(struct client *c);
void typeCommand(struct client *c);
void shutdownCommand(struct client *c);
void renameGenericCommand(struct client *c, int nx);
void renameCommand(struct client *c);
void renamenxCommand(struct client *c);
void moveCommand(struct client *c);
/* Expires API. */
int removeExpire(redisDb *db, robj *key);
void setExpire(redisDb *db, robj *key, long long when);
long long getExpire(redisDb *db, robj *key);
void propagateExpire(redisDb *db, robj *key);
int checkIfExpired(redisDb *db, robj *key);
int expireIfNeeded(redisDb *db, robj *key);
/* Expires commands. */
void expireGenericCommand(struct client *c, long long basetime, int unit);
void expireCommand(struct client *c);
void expireatCommand(struct client *c);
void pexpireCommand(struct client *c);
void pexpireatCommand(struct client *c);
void ttlGenericCommand(struct client *c, int output_ms);
void ttlCommand(struct client *c);
void pttlCommand(struct client *c);
void persistCommand(struct client *c);
/* API to get key arguments from commands. The returned arrays hold argv
 * positions and are released with getKeysFreeResult(). */
int *getKeysUsingCommandTable(struct redisCommand *cmd,robj **argv, int argc, int *numkeys);
int *getKeysFromCommand(struct redisCommand *cmd, robj **argv, int argc, int *numkeys);
void getKeysFreeResult(int *result);
int *zunionInterGetKeys(struct redisCommand *cmd, robj **argv, int argc, int *numkeys);
int *evalGetKeys(struct redisCommand *cmd, robj **argv, int argc, int *numkeys);
int *sortGetKeys(struct redisCommand *cmd, robj **argv, int argc, int *numkeys);
int *migrateGetKeys(struct redisCommand *cmd, robj **argv, int argc, int *numkeys);

/* Select the internal DB a client operates on (both set c->db). */
int fetchInternalDbByKey(struct client *c, robj *key);
int fetchInternalDbById(struct client *c, int idx);

/* Incremental background maintenance, driven by databasesCron(). */
void tryResizeHashTablesForDb(int dbid);
int incrementallyRehashForDb(int dbid);
void activeExpireCycle(vr_backend *backend, int type);
int activeExpireCycleTryExpire(redisDb *db, dictEntry *de, long long now);
void databasesCron(vr_backend *backend);

#endif


================================================
FILE: src/vr_dict.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <stdarg.h>
#include <limits.h>
#include <sys/time.h>
#include <ctype.h>

#include <vr_core.h>

/* dictEnableResize() / dictDisableResize() make it possible to
 * enable/disable resizing of the hash table as needed. This is very important
 * for Redis, as we use copy-on-write and don't want to move too much memory
 * around when there is a child performing saving operations.
 *
 * Note that even when dict_can_resize is set to 0, not all resizes are
 * prevented: a hash table is still allowed to grow if the ratio between
 * the number of elements and the number of buckets is greater than
 * dict_force_resize_ratio. */
static int dict_can_resize = 1;
static unsigned int dict_force_resize_ratio = 5;

/* -------------------------- private prototypes ---------------------------- */

static int _dictExpandIfNeeded(dict *ht);
static unsigned long _dictNextPower(unsigned long size);
static int _dictKeyIndex(dict *ht, const void *key);
static int _dictInit(dict *ht, dictType *type, void *privDataPtr);

/* -------------------------- hash functions -------------------------------- */

/* Thomas Wang's 32 bit Mix Function.
 *
 * Scrambles 'key' through a fixed sequence of shift/add/xor steps and
 * returns the mixed value. All arithmetic is unsigned, so it wraps. */
unsigned int dictIntHashFunction(unsigned int key)
{
    unsigned int h = key;

    h = h + ~(h << 15);
    h = h ^ (h >> 10);
    h = h + (h << 3);
    h = h ^ (h >> 6);
    h = h + ~(h << 11);
    h = h ^ (h >> 16);

    return h;
}

/* Seed mixed into the generic hash functions of this file. */
static uint32_t dict_hash_function_seed = 5381;

/* Replace the seed used by the hash functions. */
void dictSetHashFunctionSeed(uint32_t seed) {
    dict_hash_function_seed = seed;
}

/* Return the seed currently used by the hash functions. */
uint32_t dictGetHashFunctionSeed(void) {
    return dict_hash_function_seed;
}

/* MurmurHash2, by Austin Appleby
 *
 * Hashes the 'len' bytes starting at 'key' with the current seed and
 * returns a 32 bit value.
 *
 * Note - This code makes an assumption about how your machine behaves -
 * 1. sizeof(int) == 4
 *
 * The input is consumed four bytes at a time through memcpy(), so 'key'
 * may have any alignment.
 *
 * And it has a few limitations -
 *
 * 1. It will not work incrementally.
 * 2. It will not produce the same results on little-endian and big-endian
 *    machines.
 */
unsigned int dictGenHashFunction(const void *key, int len) {
    /* 'm' and 'r' are mixing constants generated offline.
     They're not really 'magic', they just happen to work well.  */
    uint32_t seed = dict_hash_function_seed;
    const uint32_t m = 0x5bd1e995;
    const int r = 24;

    /* Initialize the hash to a 'random' value */
    uint32_t h = seed ^ len;

    /* Mix 4 bytes at a time into the hash */
    const unsigned char *data = (const unsigned char *)key;

    while(len >= 4) {
        uint32_t k;

        /* Copy instead of dereferencing a casted pointer: reading through
         * (uint32_t*)data is undefined for misaligned buffers and breaks
         * the aliasing rules. Compilers turn this into a plain load. */
        memcpy(&k,data,sizeof(k));

        k *= m;
        k ^= k >> r;
        k *= m;

        h *= m;
        h ^= k;

        data += 4;
        len -= 4;
    }

    /* Handle the last few bytes of the input array  */
    switch(len) {
    case 3: h ^= data[2] << 16; /* fallthrough */
    case 2: h ^= data[1] << 8;  /* fallthrough */
    case 1: h ^= data[0]; h *= m;
            break;
    default:
            break;
    }

    /* Do a few final mixes of the hash to ensure the last few
     * bytes are well-incorporated. */
    h ^= h >> 13;
    h *= m;
    h ^= h >> 15;

    return (unsigned int)h;
}

/* Case insensitive hash function (based on djb hash).
 *
 * Starts from dict_hash_function_seed and, for each of the 'len' bytes in
 * 'buf', computes hash = hash * 33 + tolower(byte). */
unsigned int dictGenCaseHashFunction(const unsigned char *buf, int len) {
    unsigned int hash = (unsigned int)dict_hash_function_seed;
    const unsigned char *cursor = buf;
    int remaining = len;

    while (remaining--) {
        hash += (hash << 5); /* hash * 33 */
        hash += tolower(*cursor);
        cursor++;
    }
    return hash;
}

/* ----------------------------- API implementation ------------------------- */

/* Put a dictht into the "no table" state: NULL bucket array and zeroed
 * size, mask and element counter.
 * NOTE: the bucket array is not freed here; a caller that owns one must
 * release it before resetting (see _dictClear() and dictRehash()). */
static void _dictReset(dictht *ht)
{
    ht->used = 0;
    ht->sizemask = 0;
    ht->size = 0;
    ht->table = NULL;
}

/* Allocate a new dictionary and initialize it with the given type
 * callbacks and private data pointer. The returned dict has no bucket
 * array yet; it is released with dictRelease(). */
dict *dictCreate(dictType *type,
        void *privDataPtr)
{
    dict *fresh;

    fresh = dalloc(sizeof(dict));
    _dictInit(fresh,type,privDataPtr);
    return fresh;
}

/* Initialize an already allocated dict: both hash tables are reset to the
 * empty state, no rehashing is in progress (rehashidx == -1) and no
 * iterators are registered. Always returns DICT_OK. */
int _dictInit(dict *d, dictType *type,
        void *privDataPtr)
{
    int t;

    for (t = 0; t < 2; t++)
        _dictReset(&d->ht[t]);
    d->iterators = 0;
    d->rehashidx = -1;
    d->privdata = privDataPtr;
    d->type = type;
    return DICT_OK;
}

/* Resize the table to the minimal size that contains all the elements,
 * but with the invariant of a USED/BUCKETS ratio near to <= 1.
 *
 * Returns DICT_ERR when resizing is globally disabled or a rehash is in
 * progress, otherwise whatever dictExpand() returns.
 *
 * 'minimal' is an unsigned long like ht[0].used, so the element count is
 * not truncated when it exceeds INT_MAX. */
int dictResize(dict *d)
{
    unsigned long minimal;

    if (!dict_can_resize || dictIsRehashing(d)) return DICT_ERR;
    minimal = d->ht[0].used;
    if (minimal < DICT_HT_INITIAL_SIZE)
        minimal = DICT_HT_INITIAL_SIZE;
    return dictExpand(d, minimal);
}

/* Expand or create the hash table.
 *
 * 'size' is rounded up by _dictNextPower() to obtain the real number of
 * buckets. DICT_ERR is returned when a rehash is already in progress, when
 * 'size' is smaller than the number of stored elements, or when the
 * rounded size equals the current one. Otherwise a zeroed bucket array is
 * allocated and either installed directly as ht[0] (first initialization)
 * or as ht[1] with rehashidx set to 0 so that incremental rehashing can
 * start; DICT_OK is returned. */
int dictExpand(dict *d, unsigned long size)
{
    unsigned long buckets = _dictNextPower(size);
    dictht fresh; /* the new hash table */

    /* A rehash must complete before another resize can begin. */
    if (dictIsRehashing(d)) return DICT_ERR;

    /* The size is invalid if it cannot hold the current elements. */
    if (d->ht[0].used > size) return DICT_ERR;

    /* Rehashing to the same table size is not useful. */
    if (buckets == d->ht[0].size) return DICT_ERR;

    /* Allocate the new bucket array with every pointer set to NULL. */
    fresh.table = dcalloc(buckets, sizeof(dictEntry*));
    fresh.size = buckets;
    fresh.sizemask = buckets-1;
    fresh.used = 0;

    if (d->ht[0].table != NULL) {
        /* Prepare a second hash table for incremental rehashing. */
        d->ht[1] = fresh;
        d->rehashidx = 0;
    } else {
        /* First initialization: not really a rehashing, we just set the
         * first hash table so that it can accept keys. */
        d->ht[0] = fresh;
    }
    return DICT_OK;
}

/* Performs up to N steps of incremental rehashing. Returns 1 if there are
 * still keys to move from the old to the new hash table, otherwise 0.
 *
 * One step moves a whole bucket (possibly several chained keys) from ht[0]
 * to ht[1]. Because the old table may contain long runs of empty buckets,
 * the function gives up after skipping N*10 empty buckets in total, so a
 * call is not guaranteed to move even a single bucket; this bounds the
 * amount of work done per call.
 *
 * When ht[0] becomes empty its bucket array is freed, ht[1] takes its
 * place and rehashidx goes back to -1. */
int dictRehash(dict *d, int n) {
    dictht *src = &d->ht[0];
    dictht *dst = &d->ht[1];
    int empty_budget = n*10; /* Max number of empty buckets to visit. */

    if (!dictIsRehashing(d)) return 0;

    for (; n-- && src->used != 0; ) {
        dictEntry *cur;

        /* rehashidx can't run past the table: ht[0].used != 0 guarantees
         * there is at least one more populated bucket ahead. */
        ASSERT(d->ht[0].size > (unsigned long)d->rehashidx);
        for (; src->table[d->rehashidx] == NULL; ) {
            d->rehashidx++;
            if (--empty_budget == 0) return 1;
        }

        /* Move every key chained in this bucket to the new table. */
        cur = src->table[d->rehashidx];
        while (cur != NULL) {
            dictEntry *following = cur->next;
            /* Index of the key inside the new table. */
            unsigned int slot = dictHashKey(d, cur->key) & dst->sizemask;

            cur->next = dst->table[slot];
            dst->table[slot] = cur;
            src->used--;
            dst->used++;
            cur = following;
        }
        src->table[d->rehashidx] = NULL;
        d->rehashidx++;
    }

    /* More to rehash... */
    if (src->used != 0) return 1;

    /* The whole table was migrated: promote ht[1] to ht[0]. */
    dfree(src->table);
    *src = *dst;
    _dictReset(dst);
    d->rehashidx = -1;
    return 0;
}

/* Current wall-clock time, as reported by gettimeofday(), expressed in
 * milliseconds. */
long long timeInMilliseconds(void) {
    struct timeval now;
    long long ms;

    gettimeofday(&now,NULL);
    ms = ((long long)now.tv_sec)*1000;
    ms += now.tv_usec/1000;
    return ms;
}

/* Rehash for an amount of time between ms milliseconds and ms+1
 * milliseconds, in batches of 100 steps. Returns 100 times the number of
 * batches that left more work to do, i.e. an approximation of the steps
 * performed. */
int dictRehashMilliseconds(dict *d, int ms) {
    long long began = timeInMilliseconds();
    int done = 0;

    for (;;) {
        if (!dictRehash(d,100)) break;
        done += 100;
        if (timeInMilliseconds()-began > ms) break;
    }
    return done;
}

/* Perform a single step of rehashing, but only when d->iterators is zero
 * (the counter is incremented by safe iterators in dictNext()). While such
 * an iterator is in the middle of a walk we can't mess with the two hash
 * tables, otherwise some element could be missed or duplicated.
 *
 * Called by the update operations of the dictionary so that the hash
 * table automatically migrates from H1 to H2 while it is actively used. */
static void _dictRehashStep(dict *d) {
    if (d->iterators != 0) return;
    dictRehash(d,1);
}

/* Add the key/value pair to the dictionary.
 * Returns DICT_OK on success, DICT_ERR when dictAddRaw() could not create
 * the entry (for instance because the key is already present). */
int dictAdd(dict *d, void *key, void *val)
{
    dictEntry *slot = dictAddRaw(d,key);

    if (slot == NULL) return DICT_ERR;
    dictSetVal(d, slot, val);
    return DICT_OK;
}

/* Low level add. The entry for 'key' is created and linked into the table,
 * but no value is stored: the dictEntry is handed back to the caller, who
 * fills the value field as needed.
 *
 * This function is also part of the user API, mainly to store non-pointer
 * values inside the entry, for example:
 *
 * entry = dictAddRaw(dict,mykey);
 * if (entry != NULL) dictSetSignedIntegerVal(entry,1000);
 *
 * Return values:
 *
 * NULL if _dictKeyIndex() reports -1 (the key already exists, or the table
 * could not be expanded).
 * Otherwise the newly added hash entry, to be manipulated by the caller.
 */
dictEntry *dictAddRaw(dict *d, void *key)
{
    int index;
    dictEntry *entry;
    dictht *ht;

    if (dictIsRehashing(d)) _dictRehashStep(d);

    /* Slot for the new element, or -1 if it can't be added. */
    index = _dictKeyIndex(d, key);
    if (index == -1) return NULL;

    /* While rehashing, new entries always go to the new table. */
    ht = &d->ht[dictIsRehashing(d) ? 1 : 0];

    /* Link the entry at the head of the chain, on the assumption that in a
     * database system recently added entries are accessed more often. */
    entry = dalloc(sizeof(dictEntry));
    entry->next = ht->table[index];
    ht->table[index] = entry;
    ht->used++;

    /* Set the hash entry fields. */
    dictSetKey(d, entry, key);
    return entry;
}

/* Add an element, discarding the old value if the key already exists.
 * Returns 1 if the key was added from scratch, 0 if there was already an
 * element with such key and only its value was updated. */
int dictReplace(dict *d, void *key, void *val)
{
    dictEntry *existing, snapshot;

    /* If the key is not there yet, a plain add does the whole job. */
    if (dictAdd(d, key, val) == DICT_OK) return 1;

    /* It already exists, get the entry. */
    existing = dictFind(d, key);

    /* Store the new value first and free the old one afterwards. The order
     * matters because the two values may be the very same object: think of
     * reference counting, where you want to increment (set) and only then
     * decrement (free). The copy keeps the old value reachable. */
    snapshot = *existing;
    dictSetVal(d, existing, val);
    dictFreeVal(d, &snapshot);
    return 0;
}

/* dictReplaceRaw() is a variant of dictAddRaw() that hands back the entry
 * of the specified key even when the key already exists: in that case the
 * existing entry is returned, otherwise the result of dictAddRaw().
 *
 * See dictAddRaw() for more information. */
dictEntry *dictReplaceRaw(dict *d, void *key) {
    dictEntry *found = dictFind(d,key);

    if (found != NULL) return found;
    return dictAddRaw(d,key);
}

/* Search and remove an element.
 *
 * The entry matching 'key' is unlinked from its chain and its dictEntry is
 * freed. Unless 'nofree' is non-zero, the key and the value are also
 * released through dictFreeKey() / dictFreeVal().
 * Returns DICT_OK if the element was removed, DICT_ERR if it was not found
 * or the dictionary has no table yet. */
static int dictGenericDelete(dict *d, const void *key, int nofree)
{
    unsigned int h, idx;
    dictEntry *he;
    dictEntry **link; /* the pointer currently referencing 'he' */
    int table;

    if (d->ht[0].size == 0) return DICT_ERR; /* d->ht[0].table is NULL */
    if (dictIsRehashing(d)) _dictRehashStep(d);
    h = dictHashKey(d, key);

    for (table = 0; table <= 1; table++) {
        idx = h & d->ht[table].sizemask;
        link = &d->ht[table].table[idx];
        while ((he = *link) != NULL) {
            if (key==he->key || dictCompareKeys(d, key, he->key)) {
                /* Unlink the element from the list */
                *link = he->next;
                if (!nofree) {
                    dictFreeKey(d, he);
                    dictFreeVal(d, he);
                }
                dfree(he);
                d->ht[table].used--;
                return DICT_OK;
            }
            link = &he->next;
        }
        /* The second table only exists while rehashing. */
        if (!dictIsRehashing(d)) break;
    }
    return DICT_ERR; /* not found */
}

/* Remove 'key' from the dictionary. Calls dictGenericDelete() with
 * nofree == 0, so the key and value of the removed entry are also released
 * through dictFreeKey() / dictFreeVal().
 * Returns DICT_OK if the key was removed, DICT_ERR if it was not found. */
int dictDelete(dict *ht, const void *key) {
    return dictGenericDelete(ht,key,0);
}

/* Remove 'key' from the dictionary without releasing its key and value:
 * dictGenericDelete() is called with nofree == 1, so only the dictEntry
 * itself is freed.
 * Returns DICT_OK if the key was removed, DICT_ERR if it was not found. */
int dictDeleteNoFree(dict *ht, const void *key) {
    return dictGenericDelete(ht,key,1);
}

/* Destroy every element of the hash table 'ht' belonging to 'd', free its
 * bucket array and reset it to the empty state.
 *
 * If 'callback' is not NULL it is invoked with d->privdata each time the
 * bucket index is a multiple of 65536 (first bucket included).
 * Always returns DICT_OK. */
int _dictClear(dict *d, dictht *ht, void(callback)(void *)) {
    unsigned long i;

    /* Free all the elements; stop early once none is left. */
    for (i = 0; i < ht->size && ht->used > 0; i++) {
        dictEntry *he, *nextHe;

        if (callback && (i & 65535) == 0) callback(d->privdata);

        for (he = ht->table[i]; he != NULL; he = nextHe) {
            /* Grab the successor before the entry is released. */
            nextHe = he->next;
            dictFreeKey(d, he);
            dictFreeVal(d, he);
            dfree(he);
            ht->used--;
        }
    }
    /* Free the table and the allocated cache structure */
    if(ht->table) dfree(ht->table);
    /* Re-initialize the table */
    _dictReset(ht);
    return DICT_OK; /* never fails */
}

/* Clear both hash tables (no progress callback) and free the dict
 * structure itself. 'd' must not be used afterwards. */
void dictRelease(dict *d)
{
    int t;

    for (t = 0; t < 2; t++)
        _dictClear(d,&d->ht[t],NULL);
    dfree(d);
}

/* Look up 'key' and return its entry, or NULL when it is not present.
 *
 * ht[0] is searched first and, only while a rehash is in progress, ht[1]
 * as well. Unlike the update paths, no incremental rehash step is done
 * here: per the original authors' note it was removed so that reading the
 * table never rehashes it, because a read-write lock is used. */
dictEntry *dictFind(dict *d, const void *key)
{
    dictEntry *he;
    unsigned int h, idx, table;

    if (d->ht[0].used + d->ht[1].used == 0) return NULL; /* dict is empty */
    h = dictHashKey(d, key);
    for (table = 0; table <= 1; table++) {
        idx = h & d->ht[table].sizemask;
        for (he = d->ht[table].table[idx]; he; he = he->next) {
            if (key==he->key || dictCompareKeys(d, key, he->key))
                return he;
        }
        if (!dictIsRehashing(d)) break;
    }
    return NULL;
}

/* Return the value stored for 'key' (as given by dictGetVal()), or NULL
 * when dictFind() does not find the key. */
void *dictFetchValue(dict *d, const void *key) {
    dictEntry *found = dictFind(d,key);

    if (found == NULL) return NULL;
    return dictGetVal(found);
}

/* A fingerprint is a 64 bit number that represents the state of the
 * dictionary at a given time: it is derived from the table pointer, size
 * and element count of both hash tables.
 * When an unsafe iterator starts walking, dictNext() stores the
 * fingerprint, and dictReleaseIterator() checks it again. If the two
 * fingerprints differ, the user of the iterator performed forbidden
 * operations against the dictionary while iterating. */
long long dictFingerprint(dict *d) {
    long long parts[6], hash = 0;
    int t, j;

    /* Three properties per table: bucket array address, size, used. */
    for (t = 0; t < 2; t++) {
        parts[t*3] = (long) d->ht[t].table;
        parts[t*3+1] = d->ht[t].size;
        parts[t*3+2] = d->ht[t].used;
    }

    /* We hash N integers by summing every successive integer with the integer
     * hashing of the previous sum. Basically:
     *
     * Result = hash(hash(hash(int1)+int2)+int3) ...
     *
     * This way the same set of integers in a different order will (likely) hash
     * to a different number. */
    for (j = 0; j < 6; j++) {
        hash += parts[j];
        /* For the hashing step we use Thomas Wang's 64 bit integer hash. */
        hash = (~hash) + (hash << 21); // hash = (hash << 21) - hash - 1;
        hash = hash ^ (hash >> 24);
        hash = (hash + (hash << 3)) + (hash << 8); // hash * 265
        hash = hash ^ (hash >> 14);
        hash = (hash + (hash << 2)) + (hash << 4); // hash * 21
        hash = hash ^ (hash >> 28);
        hash = hash + (hash << 31);
    }
    return hash;
}

/* Allocate a non safe iterator over 'd', positioned before the first
 * bucket of ht[0] (table 0, index -1). It is advanced with dictNext() and
 * freed with dictReleaseIterator(). */
dictIterator *dictGetIterator(dict *d)
{
    dictIterator *it = dalloc(sizeof(dictIterator));

    it->d = d;
    it->safe = 0;
    it->table = 0;
    it->index = -1;
    it->nextEntry = NULL;
    it->entry = NULL;
    return it;
}

/* Same as dictGetIterator(), but the iterator is flagged as safe: while it
 * is walking, dictNext() keeps d->iterators incremented, which makes
 * _dictRehashStep() skip its rehashing work. */
dictIterator *dictGetSafeIterator(dict *d) {
    dictIterator *it = dictGetIterator(d);

    it->safe = 1;
    return it;
}

/* Advance the iterator and return the next entry, or NULL when every
 * bucket has been visited.
 *
 * Buckets of ht[0] are walked in index order, each chain from head to
 * tail; if a rehash is in progress when ht[0] is exhausted, the walk
 * continues with ht[1]. */
dictEntry *dictNext(dictIterator *iter)
{
    while (1) {
        if (iter->entry == NULL) {
            /* Current chain exhausted (or first call): move to next bucket. */
            dictht *ht = &iter->d->ht[iter->table];
            if (iter->index == -1 && iter->table == 0) {
                /* Very first step: a safe iterator registers itself in the
                 * dict, an unsafe one records the fingerprint that
                 * dictReleaseIterator() verifies later. */
                if (iter->safe)
                    iter->d->iterators++;
                else
                    iter->fingerprint = dictFingerprint(iter->d);
            }
            iter->index++;
            if (iter->index >= (long) ht->size) {
                /* Past the last bucket of the current table. */
                if (dictIsRehashing(iter->d) && iter->table == 0) {
                    /* Switch to the rehashing target table. */
                    iter->table++;
                    iter->index = 0;
                    ht = &iter->d->ht[1];
                } else {
                    break;
                }
            }
            iter->entry = ht->table[iter->index];
        } else {
            /* Continue along the chain using the pointer saved earlier. */
            iter->entry = iter->nextEntry;
        }
        if (iter->entry) {
            /* We need to save the 'next' here, the iterator user
             * may delete the entry we are returning. */
            iter->nextEntry = iter->entry->next;
            return iter->entry;
        }
    }
    return NULL;
}

/* Free an iterator obtained with dictGetIterator() or
 * dictGetSafeIterator().
 *
 * If the iterator was advanced at least once, a safe iterator unregisters
 * itself from the dict, while an unsafe one asserts that the dictionary
 * fingerprint is still the one recorded by dictNext(). */
void dictReleaseIterator(dictIterator *iter)
{
    int untouched = (iter->index == -1 && iter->table == 0);

    if (!untouched) {
        if (!iter->safe) {
            long long hv = dictFingerprint(iter->d);
            ASSERT(iter->fingerprint == hv);
        } else {
            iter->d->iterators--;
        }
    }
    dfree(iter);
}

/* Return a random entry from the hash table, or NULL if the dictionary is
 * empty. Useful to implement randomized algorithms.
 *
 * A non-empty bucket is picked at random (across both tables while a
 * rehash is in progress), then a random element of its chain is returned.
 * One incremental rehash step may be performed as a side effect.
 *
 * The bucket index 'h' is an unsigned long, like the table sizes it is
 * computed from, so it is not truncated on very large tables. */
dictEntry *dictGetRandomKey(dict *d)
{
    dictEntry *he, *orighe;
    unsigned long h;
    int listlen, listele;

    if (dictSize(d) == 0) return NULL;
    if (dictIsRehashing(d)) _dictRehashStep(d);
    if (dictIsRehashing(d)) {
        do {
            /* We are sure there are no elements in indexes from 0
             * to rehashidx-1 */
            h = d->rehashidx + (random() % (d->ht[0].size +
                                            d->ht[1].size -
                                            d->rehashidx));
            he = (h >= d->ht[0].size) ? d->ht[1].table[h - d->ht[0].size] :
                                      d->ht[0].table[h];
        } while(he == NULL);
    } else {
        do {
            h = random() & d->ht[0].sizemask;
            he = d->ht[0].table[h];
        } while(he == NULL);
    }

    /* Now we found a non empty bucket, but it is a linked
     * list and we need to get a random element from the list.
     * The only sane way to do so is counting the elements and
     * select a random index. */
    listlen = 0;
    orighe = he;
    while(he) {
        he = he->next;
        listlen++;
    }
    listele = random() % listlen;
    he = orighe;
    while(listele--) he = he->next;
    return he;
}

/* This function samples the dictionary to return a few keys from random
 * locations.
 *
 * It does not guarantee to return all the keys specified in 'count', nor
 * it does guarantee to return non-duplicated elements, however it will make
 * some effort to do both things.
 *
 * Returned pointers to hash table entries are stored into 'des' that
 * points to an array of dictEntry pointers. The array must have room for
 * at least 'count' elements, that is the argument we pass to the function
 * to tell how many random elements we need.
 *
 * The function returns the number of items stored into 'des', that may
 * be less than 'count' if the hash table has less than 'count' elements
 * inside, or if not enough elements were found in a reasonable amount of
 * steps.
 *
 * Note that this function is not suitable when you need a good distribution
 * of the returned items, but only when you need to "sample" a given number
 * of continuous elements to run some kind of algorithm or to produce
 * statistics. However the function is much faster than dictGetRandomKey()
 * at producing N elements. */
unsigned int dictGetSomeKeys(dict *d, dictEntry **des, unsigned int count) {
    unsigned long j; /* internal hash table id, 0 or 1. */
    unsigned long tables; /* 1 or 2 tables? */
    unsigned long stored = 0, maxsizemask;
    unsigned long maxsteps;

    if (dictSize(d) < count) count = dictSize(d);
    maxsteps = count*10;

    /* Try to do a rehashing work proportional to 'count'. */
    for (j = 0; j < count; j++) {
        if (dictIsRehashing(d))
            _dictRehashStep(d);
        else
            break;
    }

    tables = dictIsRehashing(d) ? 2 : 1;
    maxsizemask = d->ht[0].sizemask;
    if (tables > 1 && maxsizemask < d->ht[1].sizemask)
        maxsizemask = d->ht[1].sizemask;

    /* Pick a random point inside the larger table. */
    unsigned long i = random() & maxsizemask;
    unsigned long emptylen = 0; /* Continuous empty entries so far. */
    while(stored < count && maxsteps--) {
        for (j = 0; j < tables; j++) {
            /* Invariant of the dict.c rehashing: up to the indexes already
             * visited in ht[0] during the rehashing, there are no populated
             * buckets, so we can skip ht[0] for indexes between 0 and idx-1. */
            if (tables == 2 && j == 0 && i < (unsigned long) d->rehashidx) {
                /* Moreover, if we are currently out of range in the second
                 * table, there will be no elements in both tables up to
                 * the current rehashing index, so we jump if possible.
                 * (this happens when going from big to small table).
                 *
                 * After the jump we must NOT skip ht[0]: the bucket at
                 * rehashidx may be populated, so only the no-jump case
                 * moves on to the next table. */
                if (i >= d->ht[1].size)
                    i = d->rehashidx;
                else
                    continue;
            }
            if (i >= d->ht[j].size) continue; /* Out of range for this table. */
            dictEntry *he = d->ht[j].table[i];

            /* Count contiguous empty buckets, and jump to other
             * locations if they reach 'count' (with a minimum of 5). */
            if (he == NULL) {
                emptylen++;
                if (emptylen >= 5 && emptylen > count) {
                    i = random() & maxsizemask;
                    emptylen = 0;
                }
            } else {
                emptylen = 0;
                while (he) {
                    /* Collect all the elements of the buckets found non
                     * empty while iterating. */
                    *des = he;
                    des++;
                    he = he->next;
                    stored++;
                    if (stored == count) return stored;
                }
            }
        }
        i = (i+1) & maxsizemask;
    }
    return stored;
}

/* Reverse the order of the bits of 'v'. Algorithm from:
 * http://graphics.stanford.edu/~seander/bithacks.html#ReverseParallel
 *
 * Blocks of bits are swapped pairwise, halving the block width at every
 * round, starting from half the width of an unsigned long. */
static unsigned long rev(unsigned long v) {
    unsigned long width = 8 * sizeof(v); /* bit size; must be power of 2 */
    unsigned long mask = ~0UL;
    unsigned long half;

    for (half = width >> 1; half > 0; half >>= 1) {
        mask ^= (mask << half);
        v = ((v >> half) & mask) | ((v << half) & ~mask);
    }
    return v;
}

/* dictScan() is used to iterate over the elements of a dictionary.
 *
 * Iterating works the following way:
 *
 * 1) Initially you call the function using a cursor (v) value of 0.
 * 2) The function performs one step of the iteration, and returns the
 *    new cursor value you must use in the next call.
 * 3) When the returned cursor is 0, the iteration is complete.
 *
 * The function guarantees all elements present in the
 * dictionary get returned between the start and end of the iteration.
 * However it is possible some elements get returned multiple times.
 *
 * For every element returned, the callback argument 'fn' is
 * called with 'privdata' as first argument and the dictionary entry
 * 'de' as second argument.
 *
 * HOW IT WORKS.
 *
 * The iteration algorithm was designed by Pieter Noordhuis.
 * The main idea is to increment a cursor starting from the higher order
 * bits. That is, instead of incrementing the cursor normally, the bits
 * of the cursor are reversed, then the cursor is incremented, and finally
 * the bits are reversed again.
 *
 * This strategy is needed because the hash table may be resized between
 * iteration calls.
 *
 * dict.c hash tables are always power of two in size, and they
 * use chaining, so the position of an element in a given table is given
 * by computing the bitwise AND between Hash(key) and SIZE-1
 * (where SIZE-1 is always the mask that is equivalent to taking the rest
 *  of the division between the Hash of the key and SIZE).
 *
 * For example if the current hash table size is 16, the mask is
 * (in binary) 1111. The position of a key in the hash table will always be
 * the last four bits of the hash output, and so forth.
 *
 * WHAT HAPPENS IF THE TABLE CHANGES IN SIZE?
 *
 * If the hash table grows, elements can go anywhere in one multiple of
 * the old bucket: for example let's say we already iterated with
 * a 4 bit cursor 1100 (the mask is 1111 because hash table size = 16).
 *
 * If the hash table will be resized to 64 elements, then the new mask will
 * be 111111. The new buckets you obtain by substituting in ??1100
 * with either 0 or 1 can be targeted only by keys we already visited
 * when scanning the bucket 1100 in the smaller hash table.
 *
 * By iterating the higher bits first, because of the inverted counter, the
 * cursor does not need to restart if the table size gets bigger. It will
 * continue iterating using cursors without '1100' at the end, and also
 * without any other combination of the final 4 bits already explored.
 *
 * Similarly when the table size shrinks over time, for example going from
 * 16 to 8, if a combination of the lower three bits (the mask for size 8
 * is 111) were already completely explored, it would not be visited again
 * because we are sure we tried, for example, both 0111 and 1111 (all the
 * variations of the higher bit) so we don't need to test it again.
 *
 * WAIT... YOU HAVE *TWO* TABLES DURING REHASHING!
 *
 * Yes, this is true, but we always iterate the smaller table first, then
 * we test all the expansions of the current cursor into the larger
 * table. For example if the current cursor is 101 and we also have a
 * larger table of size 16, we also test (0)101 and (1)101 inside the larger
 * table. This reduces the problem back to having only one table, where
 * the larger one, if it exists, is just an expansion of the smaller one.
 *
 * LIMITATIONS
 *
 * This iterator is completely stateless, and this is a huge advantage,
 * including no additional memory used.
 *
 * The disadvantages resulting from this design are:
 *
 * 1) It is possible we return elements more than once. However this is usually
 *    easy to deal with in the application level.
 * 2) The iterator must return multiple elements per call, as it needs to always
 *    return all the keys chained in a given bucket, and all the expansions, so
 *    we are sure we don't miss keys moving during rehashing.
 * 3) The reverse cursor is somewhat hard to understand at first, but this
 *    comment is supposed to help.
 */
/* Perform one step of the cursor based iteration described above.
 *
 * d:        dictionary to scan.
 * v:        cursor; 0 on the first call, then the value returned by the
 *           previous call.
 * fn:       callback invoked as fn(privdata, de) for every entry emitted.
 * privdata: opaque pointer handed to 'fn'.
 *
 * Returns the cursor for the next call, or 0 when the iteration is
 * complete (0 is also returned immediately for an empty dictionary).
 *
 * While rehashing, the bits of the cursor selecting the expansions inside
 * the larger table are advanced with the same reversed increment used for
 * the cursor itself. A plain increment would start from whatever value
 * those bits already have in a cursor obtained on a larger table, and
 * would miss the expansions that come "before" it in natural order when
 * the table is shrinking. */
unsigned long dictScan(dict *d,
                       unsigned long v,
                       dictScanFunction *fn,
                       void *privdata)
{
    dictht *t0, *t1;
    const dictEntry *de, *next;
    unsigned long m0, m1;

    if (dictSize(d) == 0) return 0;

    if (!dictIsRehashing(d)) {
        t0 = &(d->ht[0]);
        m0 = t0->sizemask;

        /* Emit entries at cursor. 'next' is read before the callback runs
         * so the walk does not depend on 'de' after fn() returns. */
        de = t0->table[v & m0];
        while (de) {
            next = de->next;
            fn(privdata, de);
            de = next;
        }

        /* Set unmasked bits so incrementing the reversed cursor
         * operates on the masked bits */
        v |= ~m0;

        /* Increment the reverse cursor */
        v = rev(v);
        v++;
        v = rev(v);

    } else {
        t0 = &d->ht[0];
        t1 = &d->ht[1];

        /* Make sure t0 is the smaller and t1 is the bigger table */
        if (t0->size > t1->size) {
            t0 = &d->ht[1];
            t1 = &d->ht[0];
        }

        m0 = t0->sizemask;
        m1 = t1->sizemask;

        /* Emit entries at cursor */
        de = t0->table[v & m0];
        while (de) {
            next = de->next;
            fn(privdata, de);
            de = next;
        }

        /* Iterate over indices in larger table that are the expansion
         * of the index pointed to by the cursor in the smaller table */
        do {
            /* Emit entries at cursor */
            de = t1->table[v & m1];
            while (de) {
                next = de->next;
                fn(privdata, de);
                de = next;
            }

            /* Increment the reverse cursor over the bits of the larger
             * mask: the expansion bits change first, and once they wrap
             * around the carry advances the bits of the smaller mask. */
            v |= ~m1;
            v = rev(v);
            v++;
            v = rev(v);

            /* Continue while bits covered by mask difference is non-zero */
        } while (v & (m0 ^ m1));
    }

    return v;
}

/* ------------------------- private functions ------------------------------ */

/* Expand the hash table if needed.
 *
 * Returns DICT_OK when nothing has to be done, otherwise the result of
 * dictExpand(). */
static int _dictExpandIfNeeded(dict *d)
{
    dictht *main_ht = &d->ht[0];

    /* Incremental rehashing already in progress. Return. */
    if (dictIsRehashing(d)) return DICT_OK;

    /* If the hash table is empty expand it to the initial size. */
    if (main_ht->size == 0) return dictExpand(d, DICT_HT_INITIAL_SIZE);

    /* Below the 1:1 elements/buckets ratio there is nothing to do. */
    if (main_ht->used < main_ht->size) return DICT_OK;

    /* At or above 1:1: when resizing is disabled (global setting) we still
     * grow, but only if the ratio is over the "safe" threshold. */
    if (!dict_can_resize &&
        main_ht->used/main_ht->size <= dict_force_resize_ratio)
    {
        return DICT_OK;
    }

    /* Resize doubling the number of buckets. */
    return dictExpand(d, main_ht->used*2);
}

/* Our hash table capability is a power of two.
 *
 * Returns the smallest power of two that is >= 'size' and not smaller
 * than DICT_HT_INITIAL_SIZE. Requests of LONG_MAX or more are clamped to
 * LONG_MAX + 1, the largest power of two an unsigned long can hold (plain
 * LONG_MAX is not a power of two, so LONG_MAX - 1 would not be a valid
 * size mask). */
static unsigned long _dictNextPower(unsigned long size)
{
    unsigned long i = DICT_HT_INITIAL_SIZE;

    if (size >= LONG_MAX) return LONG_MAX + 1LU;
    while(1) {
        if (i >= size)
            return i;
        i *= 2;
    }
}

/* Returns the index of the bucket that can be populated with a hash entry
 * for the given 'key'.
 * -1 is returned if the key already exists, or if expanding the table
 * failed.
 *
 * Note that if we are in the process of rehashing the hash table, the
 * index is always returned in the context of the second (new) hash table. */
static int _dictKeyIndex(dict *d, const void *key)
{
    unsigned int h, idx, table;
    dictEntry *he;

    /* Expand the hash table if needed */
    if (_dictExpandIfNeeded(d) == DICT_ERR) return -1;

    /* Compute the key hash value */
    h = dictHashKey(d, key);

    /* Check ht[0] and, only while rehashing, ht[1] as well. 'idx' is left
     * holding the bucket of the last table inspected. */
    table = 0;
    do {
        idx = h & d->ht[table].sizemask;
        /* Search if this slot does not already contain the given key */
        for (he = d->ht[table].table[idx]; he != NULL; he = he->next) {
            if (key==he->key || dictCompareKeys(d, key, he->key))
                return -1;
        }
        table++;
    } while (table <= 1 && dictIsRehashing(d));
    return idx;
}

/* Remove every element from the dictionary, leaving an empty but still
 * usable dict: both tables are cleared (passing 'callback' along to
 * _dictClear()), rehashing is marked as not in progress and the iterator
 * counter is zeroed. */
void dictEmpty(dict *d, void(callback)(void*)) {
    int t;

    for (t = 0; t < 2; t++)
        _dictClear(d,&d->ht[t],callback);
    d->iterators = 0;
    d->rehashidx = -1;
}

/* Allow hash table resizing again by setting the file-wide
 * dict_can_resize flag to 1. */
void dictEnableResize(void) {
    dict_can_resize = 1;
}

/* Set the file-wide dict_can_resize flag to 0: dictResize() then fails and
 * _dictExpandIfNeeded() only grows a table whose elements/buckets ratio
 * exceeds dict_force_resize_ratio. */
void dictDisableResize(void) {
    dict_can_resize = 0;
}

/* ------------------------------- Debugging ---------------------------------*/

/* Number of slots in the chain length histogram: slot i counts the buckets
 * whose chain has exactly i entries, except for the last slot, which
 * collects every chain of DICT_STATS_VECTLEN-1 entries or more. */
#define DICT_STATS_VECTLEN 50

/* Write human readable statistics about the hash table 'ht' into 'buf',
 * which is 'bufsize' bytes long. 'tableid' (0 or 1) only selects the label
 * printed in the header.
 *
 * The output is always NUL terminated (when bufsize > 0) and truncated if
 * it does not fit. Unlike snprintf(), the return value is the number of
 * characters actually stored in 'buf', terminator excluded, so it is
 * always smaller than 'bufsize' (0 when 'bufsize' is 0). */
size_t _dictGetStatsHt(char *buf, size_t bufsize, dictht *ht, int tableid) {
    unsigned long i, slots = 0, chainlen, maxchainlen = 0;
    unsigned long totchainlen = 0;
    unsigned long clvector[DICT_STATS_VECTLEN];
    size_t l = 0;
    int n;

    /* Not even the terminator fits: nothing to do, nothing to measure. */
    if (bufsize == 0) return 0;

    if (ht->used == 0) {
        n = snprintf(buf,bufsize,
            "No stats available for empty dictionaries\n");
        if (n < 0) {
            buf[0] = '\0';
            return 0;
        }
        /* On truncation snprintf() reports the would-be length: clamp it
         * to what was really stored. */
        return ((size_t)n < bufsize) ? (size_t)n : bufsize-1;
    }

    /* Compute stats. */
    for (i = 0; i < DICT_STATS_VECTLEN; i++) clvector[i] = 0;
    for (i = 0; i < ht->size; i++) {
        dictEntry *he;

        if (ht->table[i] == NULL) {
            clvector[0]++;
            continue;
        }
        slots++;
        /* For each hash entry on this slot... */
        chainlen = 0;
        he = ht->table[i];
        while(he) {
            chainlen++;
            he = he->next;
        }
        clvector[(chainlen < DICT_STATS_VECTLEN) ? chainlen : (DICT_STATS_VECTLEN-1)]++;
        if (chainlen > maxchainlen) maxchainlen = chainlen;
        totchainlen += chainlen;
    }

    /* Generate human readable stats. 'slots' can't be zero here because
     * the table holds at least one element. */
    n = snprintf(buf+l,bufsize-l,
        "Hash table %d stats (%s):\n"
        " table size: %lu\n"
        " number of elements: %lu\n"
        " different slots: %lu\n"
        " max chain length: %lu\n"
        " avg chain length (counted): %.02f\n"
        " avg chain length (computed): %.02f\n"
        " Chain length distribution:\n",
        tableid, (tableid == 0) ? "main hash table" : "rehashing target",
        ht->size, ht->used, slots, maxchainlen,
        (float)totchainlen/slots, (float)ht->used/slots);
    if (n < 0) {
        buf[0] = '\0';
        return 0;
    }
    l += (size_t)n;

    /* Every histogram slot is reported, including the last "or more" one. */
    for (i = 0; i < DICT_STATS_VECTLEN; i++) {
        if (clvector[i] == 0) continue;
        if (l >= bufsize) break;
        n = snprintf(buf+l,bufsize-l,
            "   %s%lu: %lu (%.02f%%)\n",
            (i == DICT_STATS_VECTLEN-1)?">= ":"",
            i, clvector[i], ((float)clvector[i]/ht->size)*100);
        if (n < 0) {
            buf[l] = '\0';
            break;
        }
        l += (size_t)n;
    }

    /* Unlike snprintf(), return the number of characters actually written. */
    buf[bufsize-1] = '\0';
    return strlen(buf);
}

/* Fill 'buf' (capacity 'bufsize' bytes) with the statistics of the main
 * hash table of 'd', followed by those of the rehashing target when a
 * rehash is in progress. The output is truncated to fit and is always
 * NUL terminated when bufsize > 0. */
void dictGetStats(char *buf, size_t bufsize, dict *d) {
    size_t l;

    if (bufsize == 0) return;

    l = _dictGetStatsHt(buf,bufsize,&d->ht[0],0);
    /* Only append the second table when some room is left. Comparing
     * before subtracting keeps 'bufsize - l' from wrapping around if the
     * helper ever reports more than the buffer can hold. */
    if (l < bufsize && dictIsRehashing(d)) {
        _dictGetStatsHt(buf+l,bufsize-l,&d->ht[1],1);
    }
    /* Make sure there is a NULL term at the end. */
    buf[bufsize-1] = '\0';
}


================================================
FILE: src/vr_dict.h
================================================
#ifndef _VR_DICT_H_
#define _VR_DICT_H_

#include <stdint.h>

/* Status codes of the dict API.
 * NOTE(review): presumably what the int-returning functions declared below
 * yield on success / failure -- confirm against vr_dict.c. */
#define DICT_OK 0
#define DICT_ERR 1

/* Unused arguments generate annoying warnings... */
#define DICT_NOTUSED(V) ((void) V)

/* One key/value node of a hash table. The value is stored either as a
 * pointer or inline as a 64 bit integer / double (see the dictSet*Val and
 * dictGet*Val macros below). */
typedef struct dictEntry {
    void *key;
    union {
        void *val;
        uint64_t u64;
        int64_t s64;
        double d;
    } v;
    struct dictEntry *next; /* Next entry of the singly linked chain. */
} dictEntry;

/* Per-dictionary callbacks. Except for hashFunction, each pointer may be
 * NULL: the macros below test it before calling and fall back to storing
 * the raw pointer (keyDup/valDup), comparing pointers (keyCompare) or
 * doing nothing (destructors). 'privdata' is the dict's privdata field. */
typedef struct dictType {
    unsigned int (*hashFunction)(const void *key);
    void *(*keyDup)(void *privdata, const void *key);
    void *(*valDup)(void *privdata, const void *obj);
    int (*keyCompare)(void *privdata, const void *key1, const void *key2);
    void (*keyDestructor)(void *privdata, void *key);
    void (*valDestructor)(void *privdata, void *obj);
} dictType;

/* This is our hash table structure. Every dictionary has two of this as we
 * implement incremental rehashing, for the old to the new table. */
typedef struct dictht {
    dictEntry **table;      /* Array of 'size' chain heads; NULL = empty slot. */
    unsigned long size;     /* Number of slots in 'table'. */
    unsigned long sizemask; /* NOTE(review): presumably size-1, used to map a
                               hash to a slot -- confirm in vr_dict.c. */
    unsigned long used;     /* Number of entries stored in this table. */
} dictht;

/* A dictionary: the callbacks, their private data and the two hash tables
 * (ht[1] is reported as the "rehashing target" by the stats code). */
typedef struct dict {
    dictType *type;  /* Callbacks used by the dict* macros. */
    void *privdata;  /* Passed as first argument to the callbacks in 'type'. */
    dictht ht[2];
    long rehashidx; /* rehashing not in progress if rehashidx == -1 */
    int iterators; /* number of iterators currently running */
} dict;

/* If safe is set to 1 this is a safe iterator, that means, you can call
 * dictAdd, dictFind, and other functions against the dictionary even while
 * iterating. Otherwise it is a non safe iterator, and only dictNext()
 * should be called while iterating. */
typedef struct dictIterator {
    dict *d;            /* Dictionary being iterated. */
    long index;         /* NOTE(review): presumably the current slot index --
                           confirm in vr_dict.c. */
    int table, safe;    /* 'safe' is the flag described above; 'table'
                           presumably selects ht[0] or ht[1]. */
    dictEntry *entry, *nextEntry;
    /* unsafe iterator fingerprint for misuse detection. */
    long long fingerprint;
} dictIterator;

typedef void (dictScanFunction)(void *privdata, const dictEntry *de);

/* This is the initial size of every hash table */
#define DICT_HT_INITIAL_SIZE     4

/* ------------------------------- Macros ------------------------------------*/
/* Statement-like macros are wrapped in do { ... } while(0) so that each of
 * them is exactly one statement: a bare 'if' expansion would capture the
 * 'else' of an enclosing if/else written by the caller. Macro arguments
 * are parenthesized so that expressions can be passed safely. */

/* Run the value destructor of the dict type, if any, on the entry value. */
#define dictFreeVal(d, entry) do { \
    if ((d)->type->valDestructor) \
        (d)->type->valDestructor((d)->privdata, (entry)->v.val); \
} while(0)

/* Store '_val_' in the entry, duplicating it through valDup when the type
 * provides one, otherwise storing the pointer as is. */
#define dictSetVal(d, entry, _val_) do { \
    if ((d)->type->valDup) \
        (entry)->v.val = (d)->type->valDup((d)->privdata, (_val_)); \
    else \
        (entry)->v.val = (_val_); \
} while(0)

/* Store an inline (non pointer) value in the entry. */
#define dictSetSignedIntegerVal(entry, _val_) \
    do { (entry)->v.s64 = (_val_); } while(0)

#define dictSetUnsignedIntegerVal(entry, _val_) \
    do { (entry)->v.u64 = (_val_); } while(0)

#define dictSetDoubleVal(entry, _val_) \
    do { (entry)->v.d = (_val_); } while(0)

/* Run the key destructor of the dict type, if any, on the entry key. */
#define dictFreeKey(d, entry) do { \
    if ((d)->type->keyDestructor) \
        (d)->type->keyDestructor((d)->privdata, (entry)->key); \
} while(0)

/* Store '_key_' in the entry, duplicating it through keyDup when the type
 * provides one, otherwise storing the pointer as is. */
#define dictSetKey(d, entry, _key_) do { \
    if ((d)->type->keyDup) \
        (entry)->key = (d)->type->keyDup((d)->privdata, (_key_)); \
    else \
        (entry)->key = (_key_); \
} while(0)

/* Non-zero when the two keys are equal: uses keyCompare when the type
 * provides one, pointer identity otherwise. */
#define dictCompareKeys(d, key1, key2) \
    (((d)->type->keyCompare) ? \
        (d)->type->keyCompare((d)->privdata, (key1), (key2)) : \
        (key1) == (key2))

#define dictHashKey(d, key) ((d)->type->hashFunction(key))
#define dictGetKey(he) ((he)->key)
#define dictGetVal(he) ((he)->v.val)
#define dictGetSignedIntegerVal(he) ((he)->v.s64)
#define dictGetUnsignedIntegerVal(he) ((he)->v.u64)
#define dictGetDoubleVal(he) ((he)->v.d)
/* Total slots / total entries across both hash tables. */
#define dictSlots(d) ((d)->ht[0].size+(d)->ht[1].size)
#define dictSize(d) ((d)->ht[0].used+(d)->ht[1].used)
#define dictIsRehashing(d) ((d)->rehashidx != -1)

/* API */
dict *dictCreate(dictType *type, void *privDataPtr);
int dictExpand(dict *d, unsigned long size);
int dictAdd(dict *d, void *key, void *val);
dictEntry *dictAddRaw(dict *d, void *key);
int dictReplace(dict *d, void *key, void *val);
dictEntry *dictReplaceRaw(dict *d, void *key);
int dictDelete(dict *d, const void *key);
int dictDeleteNoFree(dict *d, const void *key);
void dictRelease(dict *d);
dictEntry * dictFind(dict *d, const void *key);
void *dictFetchValue(dict *d, const void *key);
int dictResize(dict *d);
dictIterator *dictGetIterator(dict *d);
dictIterator *dictGetSafeIterator(dict *d);
dictEntry *dictNext(dictIterator *iter);
void dictReleaseIterator(dictIterator *iter);
dictEntry *dictGetRandomKey(dict *d);
unsigned int dictGetSomeKeys(dict *d, dictEntry **des, unsigned int count);
void dictGetStats(char *buf, size_t bufsize, dict *d);
unsigned int dictGenHashFunction(const void *key, int len);
unsigned int dictGenCaseHashFunction(const unsigned char *buf, int len);
void dictEmpty(dict *d, void(callback)(void*));
void dictEnableResize(void);
void dictDisableResize(void);
int dictRehash(dict *d, int n);
int dictRehashMilliseconds(dict *d, int ms);
void dictSetHashFunctionSeed(unsigned int initval);
unsigned int dictGetHashFunctionSeed(void);
unsigned long dictScan(dict *d, unsigned long v, dictScanFunction *fn, void *privdata);

/* Hash table types */
extern dictType dictTypeHeapStringCopyKey;
extern dictType dictTypeHeapStrings;
extern dictType dictTypeHeapStringCopyKeyValue;

#endif /* _VR_DICT_H_ */


================================================
FILE: src/vr_eventloop.c
================================================
#include <vr_core.h>

/* Initialize the event loop state 'vel'.
 *
 * Every member is first reset to its default (pointers to NULL, hz to 10,
 * client ids starting from 1), then the ae event loop sized for 'filelimit'
 * descriptors, the connection base, the client lists, the stats and the
 * config cache are created.
 *
 * Returns VR_OK on success, VR_ERROR on invalid arguments or when the event
 * loop / connection base cannot be set up, VR_ENOMEM when an allocation
 * fails. On failure the members created so far are left in 'vel'.
 * NOTE(review): since all pointers are NULLed up front this looks designed
 * for the caller to run vr_eventloop_deinit() after a failed init -- confirm
 * at the call sites. */
int
vr_eventloop_init(vr_eventloop *vel, int filelimit)
{
    rstatus_t status;

    if (vel == NULL || filelimit <= 0) {
        return VR_ERROR;
    }

    vr_thread_init(&vel->thread);
    vel->el = NULL;
    vel->hz = 10;
    vel->cronloops = 0;
    vel->unixtime = time(NULL);
    vel->mstime = vr_msec_now();
    vel->lruclock = getLRUClock();
    vel->cb = NULL;
    vel->next_client_id = 1;    /* Client IDs, start from 1 .*/
    vel->current_client = NULL;
    vel->clients = NULL;
    vel->clients_pending_write = NULL;
    vel->clients_to_close = NULL;
    vel->clients_paused = 0;
    vel->clients_pause_end_time = 0;
    vel->stats = NULL;
    vel->resident_set_size = 0;
    vel->dirty = 0;
    vel->bpop_blocked_clients = 0;
    vel->unblocked_clients = NULL;
    vel->clients_waiting_acks = NULL;
    vel->pubsub_channels = NULL;
    vel->pubsub_patterns = NULL;
    vel->notify_keyspace_events = 0;
    vel->cstable = NULL;

    vel->el = aeCreateEventLoop(filelimit);
    if (vel->el == NULL) {
        log_error("create eventloop failed.");
        return VR_ERROR;
    }

    vel->cb = dalloc(sizeof(conn_base));
    if (vel->cb == NULL) {
        log_error("create conn_base failed: out of memory");
        return VR_ENOMEM;
    }
    status = conn_init(vel->cb);
    if (status != VR_OK) {
        log_error("init conn_base failed");
        return VR_ERROR;
    }

    vel->clients = dlistCreate();
    if (vel->clients == NULL) {
        log_error("create list failed: out of memory");
        return VR_ENOMEM;
    }

    vel->clients_pending_write = dlistCreate();
    if (vel->clients_pending_write == NULL) {
        log_error("create list failed: out of memory");
        return VR_ENOMEM;
    }

    vel->clients_to_close = dlistCreate();
    if (vel->clients_to_close == NULL) {
        log_error("create list failed: out of memory");
        return VR_ENOMEM;
    }

    vel->unblocked_clients = dlistCreate();
    if (vel->unblocked_clients == NULL) {
        log_error("create list failed: out of memory");
        return VR_ENOMEM;
    }

    vel->stats = dalloc(sizeof(vr_stats));
    if (vel->stats == NULL) {
        log_error("out of memory");
        return VR_ENOMEM;
    }

    vr_stats_init(vel->stats);

    /* Done last: the config cache is only initialized on the success path. */
    conf_cache_init(&vel->cc);

    return VR_OK;
}

/* Release everything owned by 'vel'. NULL is accepted and ignored, and
 * every member is checked against NULL before being released and reset to
 * NULL afterwards.
 *
 * Clients found in 'clients' and 'clients_to_close' are freed; the
 * 'clients_pending_write' and 'unblocked_clients' lists are only emptied,
 * their elements are not freed here. */
void
vr_eventloop_deinit(vr_eventloop *vel)
{
    client *c;

    if (vel == NULL) {
        return;
    }

    vr_thread_deinit(&vel->thread);

    if (vel->el != NULL) {
        aeDeleteEventLoop(vel->el);
        vel->el = NULL;
    }

    if (vel->clients != NULL) {
        while ((c = dlistPop(vel->clients)) != NULL) {
            freeClient(c);
        }
        dlistRelease(vel->clients);
        vel->clients = NULL;
    }

    if (vel->clients_pending_write != NULL) {
        /* Drain only: the elements are not freed through this list. */
        while (dlistPop(vel->clients_pending_write) != NULL) {}
        dlistRelease(vel->clients_pending_write);
        vel->clients_pending_write = NULL;
    }

    if (vel->clients_to_close != NULL) {
        while ((c = dlistPop(vel->clients_to_close)) != NULL) {
            freeClient(c);
        }
        dlistRelease(vel->clients_to_close);
        vel->clients_to_close = NULL;
    }

    if (vel->unblocked_clients != NULL) {
        /* Drain only: the elements are not freed through this list. */
        while (dlistPop(vel->unblocked_clients) != NULL) {}
        dlistRelease(vel->unblocked_clients);
        vel->unblocked_clients = NULL;
    }

    if (vel->cb != NULL) {
        conn_deinit(vel->cb);
        dfree(vel->cb);
        vel->cb = NULL;
    }

    if (vel->stats != NULL) {
        vr_stats_deinit(vel->stats);
        dfree(vel->stats);
        vel->stats = NULL;
    }

    if (vel->cstable != NULL) {
        commandStatsTableDestroy(vel->cstable);
        vel->cstable = NULL;
    }

    conf_cache_deinit(&vel->cc);
}


================================================
FILE: src/vr_eventloop.h
================================================
#ifndef _VR_EVENTLOOP_H_
#define _VR_EVENTLOOP_H_

/* State of one event loop. It is set up by vr_eventloop_init() and torn
 * down by vr_eventloop_deinit(). */
typedef struct vr_eventloop {
    vr_thread thread;           /* Set up by vr_thread_init() in vr_eventloop_init(). */

    aeEventLoop *el;            /* ae event loop, created with the file limit passed to init */
    int hz;                     /* cron() calls frequency in hertz */
    int cronloops;              /* Number of times the cron function run */
    
    /* time cache */
    time_t unixtime;            /* Unix time sampled every cron cycle. */
    long long mstime;           /* Like 'unixtime' but with milliseconds resolution. */

    unsigned lruclock:LRU_BITS; /* Clock for LRU eviction */

    conn_base *cb;              /* Connection base, allocated and conn_init()ed in init */

    uint64_t next_client_id;    /* Next client unique ID. Incremental. */
    struct client *current_client;     /* Current client, only used on crash report */
    dlist *clients;              /* List of active clients */
    dlist *clients_pending_write;/* There is to write or install handler. */
    dlist *clients_to_close;     /* Clients to close asynchronously */

    int clients_paused;         /* True if clients are currently paused */
    long long clients_pause_end_time; /* Time when we undo clients_paused */

    vr_stats *stats;            /* stats for this thread */
    size_t resident_set_size;   /* RSS sampled in workerCron(). */

    long long dirty;            /* Changes to DB from the last save */

    /* Blocked clients */
    unsigned int bpop_blocked_clients; /* Number of clients blocked by lists */
    dlist *unblocked_clients;        /* list of clients to unblock before next loop */

    /* Synchronous replication. */
    dlist *clients_waiting_acks;     /* Clients waiting in WAIT command. */

    /* Pubsub */
    dict *pubsub_channels;  /* Map channels to list of subscribed clients */
    dlist *pubsub_patterns;  /* A list of pubsub_patterns */
    int notify_keyspace_events; /* Events to propagate via Pub/Sub. This is an
                                   xor of NOTIFY_... flags. */

    conf_cache cc; /* Cache the hot config option to improve vire speed. */

    /* Not created by vr_eventloop_init() (left NULL there); released with
     * commandStatsTableDestroy() in vr_eventloop_deinit(). */
    struct darray *cstable; /* type: commandStats */
}vr_eventloop;

int vr_eventloop_init(vr_eventloop *vel, int filelimit);
void vr_eventloop_deinit(vr_eventloop *vel);

#endif


================================================
FILE: src/vr_hyperloglog.c
================================================
#include <vr_core.h>

#include <stdint.h>
#include <math.h>

/* The Redis HyperLogLog implementation is based on the following ideas:
 *
 * * The use of a 64 bit hash function as proposed in [1], in order not to be
 *   limited to cardinalities up to 10^9, at the cost of just 1 additional
 *   bit per register.
 * * The use of 16384 6-bit registers for a great level of accuracy, using
 *   a total of 12k per key.
 * * The use of the Redis string data type. No new type is introduced.
 * * No attempt is made to compress the data structure as in [1]. Also the
 *   algorithm used is the original HyperLogLog Algorithm as in [2], with
 *   the only difference that a 64 bit hash function is used, so no correction
 *   is performed for values near 2^32 as in [1].
 *
 * [1] Heule, Nunkesser, Hall: HyperLogLog in Practice: Algorithmic
 *     Engineering of a State of The Art Cardinality Estimation Algorithm.
 *
 * [2] P. Flajolet, Éric Fusy, O. Gandouet, and F. Meunier. Hyperloglog: The
 *     analysis of a near-optimal cardinality estimation algorithm.
 *
 * Redis uses two representations:
 *
 * 1) A "dense" representation where every entry is represented by
 *    a 6-bit integer.
 * 2) A "sparse" representation using run length compression suitable
 *    for representing HyperLogLogs with many registers set to 0 in
 *    a memory efficient way.
 *
 *
 * HLL header
 * ===
 *
 * Both the dense and sparse representation have a 16 byte header as follows:
 *
 * +------+---+-----+----------+
 * | HYLL | E | N/U | Cardin.  |
 * +------+---+-----+----------+
 *
 * The first 4 bytes are a magic string set to the bytes "HYLL".
 * "E" is one byte encoding, currently set to HLL_DENSE or
 * HLL_SPARSE. N/U are three not used bytes.
 *
 * The "Cardin." field is a 64 bit integer stored in little endian format
 * with the latest cardinality computed that can be reused if the data
 * structure was not modified since the last computation (this is useful
 * because there are high probabilities that HLLADD operations don't
 * modify the actual data structure and hence the approximated cardinality).
 *
 * When the most significant bit in the most significant byte of the cached
 * cardinality is set, it means that the data structure was modified and
 * we can't reuse the cached value that must be recomputed.
 *
 * Dense representation
 * ===
 *
 * The dense representation used by Redis is the following:
 *
 * +--------+--------+--------+------//      //--+
 * |11000000|22221111|33333322|55444444 ....     |
 * +--------+--------+--------+------//      //--+
 *
 * The 6 bits counters are encoded one after the other starting from the
 * LSB to the MSB, and using the next bytes as needed.
 *
 * Sparse representation
 * ===
 *
 * The sparse representation encodes registers using a run length
 * encoding composed of three opcodes, two using one byte, and one using
 * of two bytes. The opcodes are called ZERO, XZERO and VAL.
 *
 * ZERO opcode is represented as 00xxxxxx. The 6-bit integer represented
 * by the six bits 'xxxxxx', plus 1, means that there are N registers set
 * to 0. This opcode can represent from 1 to 64 contiguous registers set
 * to the value of 0.
 *
 * XZERO opcode is represented by two bytes 01xxxxxx yyyyyyyy. The 14-bit
 * integer represented by the bits 'xxxxxx' as most significant bits and
 * 'yyyyyyyy' as least significant bits, plus 1, means that there are N
 * registers set to 0. This opcode can represent from 1 to 16384 contiguous
 * registers set to the value of 0.
 *
 * VAL opcode is represented as 1vvvvvxx. It contains a 5-bit integer
 * representing the value of a register, and a 2-bit integer representing
 * the number of contiguous registers set to that value 'vvvvv'.
 * To obtain the value and run length, the integers vvvvv and xx must be
 * incremented by one. This opcode can represent values from 1 to 32,
 * repeated from 1 to 4 times.
 *
 * The sparse representation can't represent registers with a value greater
 * than 32, however it is very unlikely that we find such a register in an
 * HLL with a cardinality where the sparse representation is still more
 * memory efficient than the dense representation. When this happens the
 * HLL is converted to the dense representation.
 *
 * The sparse representation is purely positional. For example a sparse
 * representation of an empty HLL is just: XZERO:16384.
 *
 * An HLL having only 3 non-zero registers at position 1000, 1020, 1021
 * respectively set to 2, 3, 3, is represented by the following three
 * opcodes:
 *
 * XZERO:1000 (Registers 0-999 are set to 0)
 * VAL:2,1    (1 register set to value 2, that is register 1000)
 * ZERO:19    (Registers 1001-1019 set to 0)
 * VAL:3,2    (2 registers set to value 3, that is registers 1020,1021)
 * XZERO:15362 (Registers 1022-16383 set to 0)
 *
 * In the example the sparse representation used just 7 bytes instead
 * of 12k in order to represent the HLL registers. In general for low
 * cardinality there is a big win in terms of space efficiency, traded
 * with CPU time since the sparse representation is slower to access:
 *
 * The following table shows average cardinality vs bytes used, 100
 * samples per cardinality (when the set was not representable because
 * of registers with too big value, the dense representation size was used
 * as a sample).
 *
 * 100 267
 * 200 485
 * 300 678
 * 400 859
 * 500 1033
 * 600 1205
 * 700 1375
 * 800 1544
 * 900 1713
 * 1000 1882
 * 2000 3480
 * 3000 4879
 * 4000 6089
 * 5000 7138
 * 6000 8042
 * 7000 8823
 * 8000 9500
 * 9000 10088
 * 10000 10591
 *
 * The dense representation uses 12288 bytes, so there is a big win up to
 * a cardinality of ~2000-3000. For bigger cardinalities the constant times
 * involved in updating the sparse representation is not justified by the
 * memory savings. The exact maximum length of the sparse representation
 * when this implementation switches to the dense representation is
 * configured via the define server.hll_sparse_max_bytes.
 */

/* Header found at the beginning of every HLL value, for both encodings.
 * The fixed part is 16 bytes (4 + 1 + 3 + 8); the encoded registers follow
 * immediately in the flexible array member. */
struct hllhdr {
    char magic[4];      /* "HYLL" */
    uint8_t encoding;   /* HLL_DENSE or HLL_SPARSE. */
    uint8_t notused[3]; /* Reserved for future use, must be zero. */
    uint8_t card[8];    /* Cached cardinality, little endian. */
    uint8_t registers[]; /* Data bytes. */
};

/* The cached cardinality MSB is used to signal validity of the cached value. */
#define HLL_INVALIDATE_CACHE(hdr) (hdr)->card[7] |= (1<<7)
#define HLL_VALID_CACHE(hdr) (((hdr)->card[7] & (1<<7)) == 0)

#define HLL_P 14 /* The greater is P, the smaller the error. */
#define HLL_REGISTERS (1<<HLL_P) /* With P=14, 16384 registers. */
#define HLL_P_MASK (HLL_REGISTERS-1) /* Mask to index register. */
#define HLL_BITS 6 /* Enough to count up to 63 leading zeroes. */
#define HLL_REGISTER_MAX ((1<<HLL_BITS)-1)
#define HLL_HDR_SIZE sizeof(struct hllhdr)
/* Header plus the registers packed HLL_BITS bits each, rounded up to a
 * whole byte: 16 + 12288 bytes with the values above. */
#define HLL_DENSE_SIZE (HLL_HDR_SIZE+((HLL_REGISTERS*HLL_BITS+7)/8))
#define HLL_DENSE 0 /* Dense encoding. */
#define HLL_SPARSE 1 /* Sparse encoding. */
#define HLL_RAW 255 /* Only used internally, never exposed. */
#define HLL_MAX_ENCODING 1

/* Error reply text for a corrupted HLL value. */
static char *invalid_hll_err = "-INVALIDOBJ Corrupted HLL object detected\r\n";

/* =========================== Low level bit macros ========================= */

/* Macros to access the dense representation.
 *
 * We need to get and set 6 bit counters in an array of 8 bit bytes.
 * We use macros to make sure the code is inlined since speed is critical
 * especially in order to compute the approximated cardinality in
 * HLLCOUNT where we need to access all the registers at once.
 * For the same reason we also want to avoid conditionals in this code path.
 *
 * +--------+--------+--------+------//
 * |11000000|22221111|33333322|55444444
 * +--------+--------+--------+------//
 *
 * Note: in the above representation the most significant bit (MSB)
 * of every byte is on the left. We start using bits from the LSB to MSB,
 * and so forth passing to the next byte.
 *
 * Example, we want to access to counter at pos = 1 ("111111" in the
 * illustration above).
 *
 * The index of the first byte b0 containing our data is:
 *
 *  b0 = 6 * pos / 8 = 0
 *
 *   +--------+
 *   |11000000|  <- Our byte at b0
 *   +--------+
 *
 * The position of the first bit (counting from the LSB = 0) in the byte
 * is given by:
 *
 *  fb = 6 * pos % 8 -> 6
 *
 * Right shift b0 of 'fb' bits.
 *
 *   +--------+
 *   |11000000|  <- Initial value of b0
 *   |00000011|  <- After right shift of 6 pos.
 *   +--------+
 *
 * Left shift b1 by 8-fb bits (2 bits)
 *
 *   +--------+
 *   |22221111|  <- Initial value of b1
 *   |22111100|  <- After left shift of 2 bits.
 *   +--------+
 *
 * OR the two bits, and finally AND with 111111 (63 in decimal) to
 * clean the higher order bits we are not interested in:
 *
 *   +--------+
 *   |00000011|  <- b0 right shifted
 *   |22111100|  <- b1 left shifted
 *   |22111111|  <- b0 OR b1
 *   |  111111|  <- (b0 OR b1) AND 63, our value.
 *   +--------+
 *
 * We can try with a different example, like pos = 0. In this case
 * the 6-bit counter is actually contained in a single byte.
 *
 *  b0 = 6 * pos / 8 = 0
 *
 *   +--------+
 *   |11000000|  <- Our byte at b0
 *   +--------+
 *
 *  fb = 6 * pos % 8 = 0
 *
 *  So we right shift of 0 bits (no shift in practice) and
 *  left shift the next byte of 8 bits, even if we don't use it,
 *  but this has the effect of clearing the bits so the result
 *  will not be affected after the OR.
 *
 * -------------------------------------------------------------------------
 *
 * Setting the register is a bit more complex, let's assume that 'val'
 * is the value we want to set, already in the right range.
 *
 * We need two steps, in one we need to clear the bits, and in the other
 * we need to bitwise-OR the new bits.
 *
 * Let's try with 'pos' = 1, so our first byte at 'b' is 0,
 *
 * "fb" is 6 in this case.
 *
 *   +--------+
 *   |11000000|  <- Our byte at b0
 *   +--------+
 *
 * To create an AND-mask to clear the bits about this position, we just
 * initialize the mask with the value 63, left shift it of "fb" bits,
 * and finally invert the result.
 *
 *   +--------+
 *   |00111111|  <- "mask" starts at 63
 *   |11000000|  <- "mask" after left shift of "fb" bits.
 *   |00111111|  <- "mask" after invert.
 *   +--------+
 *
 * Now we can bitwise-AND the byte at "b" with the mask, and bitwise-OR
 * it with "val" left-shifted of "fb" bits to set the new bits.
 *
 * Now let's focus on the next byte b1:
 *
 *   +--------+
 *   |22221111|  <- Initial value of b1
 *   +--------+
 *
 * To build the AND mask we start again with the 63 value, right shift
 * it by 8-fb bits, and invert it.
 *
 *   +--------+
 *   |00111111|  <- "mask" set at 2^6-1
 *   |00001111|  <- "mask" after the right shift by 8-fb = 2 bits
 *   |11110000|  <- "mask" after bitwise not.
 *   +--------+
 *
 * Now we can mask it with b+1 to clear the old bits, and bitwise-OR
 * with "val" right-shifted by 8-fb bits to set the new value.
 */

/* Note: if we access the last counter, we will also access the b+1 byte
 * that is out of the array, but sds strings always have an implicit null
 * term, so the byte exists, and we can skip the conditional (or the need
 * to allocate 1 byte more explicitly). */

/* Store the value of the register at position 'regnum' into variable 'target'.
 * 'p' is an array of unsigned bytes.
 *
 * The register occupies HLL_BITS bits starting at bit (regnum*HLL_BITS)&7
 * of byte regnum*HLL_BITS/8 and may spill into the following byte, which is
 * always read. 'regnum' and 'p' are parenthesized so that any expression
 * can be passed; every temporary is '_' prefixed to stay clear of caller
 * variable names. */
#define HLL_DENSE_GET_REGISTER(target,p,regnum) do { \
    uint8_t *_p = (uint8_t*) (p); \
    unsigned long _byte = (regnum)*HLL_BITS/8; \
    unsigned long _fb = (regnum)*HLL_BITS&7; \
    unsigned long _fb8 = 8 - _fb; \
    unsigned long _b0 = _p[_byte]; \
    unsigned long _b1 = _p[_byte+1]; \
    (target) = ((_b0 >> _fb) | (_b1 << _fb8)) & HLL_REGISTER_MAX; \
} while(0)

/* Set the value of the register at position 'regnum' to 'val'.
 * 'p' is an array of unsigned bytes.
 *
 * The old bits are cleared with an AND-mask and the new ones OR-ed in, on
 * the byte holding the first bit of the register and on the following one
 * (which is always touched, see the note above about the extra byte).
 * 'val' is expected to be already in the 0..HLL_REGISTER_MAX range.
 * All the arguments are parenthesized so that expressions can be passed. */
#define HLL_DENSE_SET_REGISTER(p,regnum,val) do { \
    uint8_t *_p = (uint8_t*) (p); \
    unsigned long _byte = (regnum)*HLL_BITS/8; \
    unsigned long _fb = (regnum)*HLL_BITS&7; \
    unsigned long _fb8 = 8 - _fb; \
    unsigned long _v = (val); \
    _p[_byte] &= ~(HLL_REGISTER_MAX << _fb); \
    _p[_byte] |= _v << _fb; \
    _p[_byte+1] &= ~(HLL_REGISTER_MAX >> _fb8); \
    _p[_byte+1] |= _v >> _fb8; \
} while(0)

/* Macros to access the sparse representation.
 * The macros parameter is expected to be an uint8_t pointer.
 *
 * The two most significant bits of the first opcode byte select the opcode:
 * 00 = ZERO, 01 = XZERO (two bytes long), 1x = VAL. */
#define HLL_SPARSE_XZERO_BIT 0x40 /* 01xxxxxx */
#define HLL_SPARSE_VAL_BIT 0x80 /* 1vvvvvxx */
#define HLL_SPARSE_IS_ZERO(p) (((*(p)) & 0xc0) == 0) /* 00xxxxxx */
#define HLL_SPARSE_IS_XZERO(p) (((*(p)) & 0xc0) == HLL_SPARSE_XZERO_BIT)
#define HLL_SPARSE_IS_VAL(p) ((*(p)) & HLL_SPARSE_VAL_BIT)
/* Decoders: every stored field is the real quantity minus one. */
#define HLL_SPARSE_ZERO_LEN(p) (((*(p)) & 0x3f)+1)
/* Reads two bytes: the low 6 bits of p[0] are the high part, p[1] the low. */
#define HLL_SPARSE_XZERO_LEN(p) (((((*(p)) & 0x3f) << 8) | (*((p)+1)))+1)
#define HLL_SPARSE_VAL_VALUE(p) ((((*(p)) >> 2) & 0x1f)+1)
#define HLL_SPARSE_VAL_LEN(p) (((*(p)) & 0x3)+1)
/* Largest quantities each opcode can express. */
#define HLL_SPARSE_VAL_MAX_VALUE 32
#define HLL_SPARSE_VAL_MAX_LEN 4
#define HLL_SPARSE_ZERO_MAX_LEN 64
#define HLL_SPARSE_XZERO_MAX_LEN 16384
/* Encoders: write the opcode at 'p'. No range check is done on 'val' and
 * 'len', they must fit the limits above. */
#define HLL_SPARSE_VAL_SET(p,val,len) do { \
    *(p) = (((val)-1)<<2|((len)-1))|HLL_SPARSE_VAL_BIT; \
} while(0)
#define HLL_SPARSE_ZERO_SET(p,len) do { \
    *(p) = (len)-1; \
} while(0)
/* Writes two bytes, p[0] and p[1]. */
#define HLL_SPARSE_XZERO_SET(p,len) do { \
    int _l = (len)-1; \
    *(p) = (_l>>8) | HLL_SPARSE_XZERO_BIT; \
    *((p)+1) = (_l&0xff); \
} while(0)

/* ========================= HyperLogLog algorithm  ========================= */

/* Our hash function is MurmurHash2, 64 bit version.
 * It was modified for Redis in order to provide the same result in
 * big and little endian archs (endian neutral).
 *
 * 'key' points to 'len' bytes of input, 'seed' perturbs the initial state.
 * Every 8 byte block is assembled byte by byte as a little endian word:
 * this yields the same value as a direct 64 bit load on little endian
 * hosts, while not requiring 'key' to be 8 byte aligned, not accessing the
 * buffer through an incompatible pointer type, and not depending on the
 * BYTE_ORDER macros being defined. */
uint64_t MurmurHash64A (const void * key, int len, unsigned int seed) {
    const uint64_t m = 0xc6a4a7935bd1e995ULL;
    const int r = 47;
    uint64_t h = seed ^ (len * m);
    const uint8_t *data = (const uint8_t *)key;
    const uint8_t *end = data + (len-(len&7));

    while(data != end) {
        uint64_t k;

        k = (uint64_t) data[0];
        k |= (uint64_t) data[1] << 8;
        k |= (uint64_t) data[2] << 16;
        k |= (uint64_t) data[3] << 24;
        k |= (uint64_t) data[4] << 32;
        k |= (uint64_t) data[5] << 40;
        k |= (uint64_t) data[6] << 48;
        k |= (uint64_t) data[7] << 56;

        k *= m;
        k ^= k >> r;
        k *= m;
        h ^= k;
        h *= m;
        data += 8;
    }

    /* Mix in the 1..7 trailing bytes; every case deliberately falls
     * through to the ones below it. */
    switch(len & 7) {
    case 7: h ^= (uint64_t)data[6] << 48; /* fall through */
    case 6: h ^= (uint64_t)data[5] << 40; /* fall through */
    case 5: h ^= (uint64_t)data[4] << 32; /* fall through */
    case 4: h ^= (uint64_t)data[3] << 24; /* fall through */
    case 3: h ^= (uint64_t)data[2] << 16; /* fall through */
    case 2: h ^= (uint64_t)data[1] << 8;  /* fall through */
    case 1: h ^= (uint64_t)data[0];
            h *= m;
            break;
    default:
            break;
    }

    h ^= h >> r;
    h *= m;
    h ^= h >> r;
    return h;
}

/* Hash the element 'ele' ('elesize' bytes) and return the length of the
 * "000..1" pattern found in the hash bits that are not used to select the
 * register. The register index the element maps to (the low HLL_P bits of
 * the hash) is stored in '*regp' as a side effect.
 *
 * The pattern length counts the terminating 1 as well: "001" is 3 and a 1
 * found right at the first examined bit is 1, the smallest possible value.
 * The longest run is 64-HLL_P+1 bits. */
int hllPatLen(unsigned char *ele, size_t elesize, long *regp) {
    uint64_t h = MurmurHash64A(ele,elesize,0xadc83b19ULL);
    uint64_t reg = h & HLL_P_MASK; /* Register index. */
    uint64_t probe;
    int runlen = 1; /* The closing "1" of the pattern is always counted. */

    /* Forcing the top bit to 1 guarantees that the scan below stops. */
    h |= ((uint64_t)1<<63);

    /* Start from the first bit not used to address the register and move
     * towards the MSB. On average a 1 is found after very few steps. */
    for (probe = HLL_REGISTERS; (h & probe) == 0; probe <<= 1) {
        runlen++;
    }

    *regp = (int) reg;
    return runlen;
}

/* ================== Dense representation implementation  ================== */

/* "Add" an element to a dense HyperLogLog.
 * Nothing is really stored: the register selected by the element hash is
 * raised to the element pattern length when that is greater than the value
 * it currently holds.
 *
 * 'registers' must have room for HLL_REGISTERS registers plus one extra
 * byte on the right; sds strings satisfy this automatically thanks to
 * their implicit null terminator.
 *
 * The function cannot fail. It returns 1 when a register was updated (so
 * the approximated cardinality changed), 0 otherwise. */
int hllDenseAdd(uint8_t *registers, unsigned char *ele, size_t elesize) {
    long reg;
    uint8_t current;
    uint8_t runlen = hllPatLen(ele,elesize,&reg);

    HLL_DENSE_GET_REGISTER(current,registers,reg);

    /* Nothing to do unless this element produced a longer run of zeroes. */
    if (runlen <= current) return 0;

    HLL_DENSE_SET_REGISTER(registers,reg,runlen);
    return 1;
}

/* Compute SUM(2^-reg) in the dense representation.
 * PE is an array with a pre-computed table of values 2^-reg indexed by reg.
 * As a side effect the integer pointed by 'ezp' is set to the number
 * of zero registers.
 *
 * Note that the two code paths account for zero registers differently: the
 * unrolled one adds PE[0] for each of them, the generic one skips them and
 * adds their count once at the end. The results agree as long as PE[0] is
 * 2^0 = 1 (NOTE(review): confirm where PE is built). */
double hllDenseSum(uint8_t *registers, double *PE, int *ezp) {
    double E = 0;
    int j, ez = 0;

    /* Redis default is to use 16384 registers 6 bits each. The code works
     * with other values by modifying the defines, but for our target value
     * we take a faster path with unrolled loops. */
    if (HLL_REGISTERS == 16384 && HLL_BITS == 6) {
        uint8_t *r = registers;
        unsigned long r0, r1, r2, r3, r4, r5, r6, r7, r8, r9,
                      r10, r11, r12, r13, r14, r15;
        for (j = 0; j < 1024; j++) {
            /* Handle 16 registers per iteration: 16 registers of 6 bits
             * are exactly 12 bytes, hence the 'r += 12' below. */
            r0 = r[0] & 63; if (r0 == 0) ez++;
            r1 = (r[0] >> 6 | r[1] << 2) & 63; if (r1 == 0) ez++;
            r2 = (r[1] >> 4 | r[2] << 4) & 63; if (r2 == 0) ez++;
            r3 = (r[2] >> 2) & 63; if (r3 == 0) ez++;
            r4 = r[3] & 63; if (r4 == 0) ez++;
            r5 = (r[3] >> 6 | r[4] << 2) & 63; if (r5 == 0) ez++;
            r6 = (r[4] >> 4 | r[5] << 4) & 63; if (r6 == 0) ez++;
            r7 = (r[5] >> 2) & 63; if (r7 == 0) ez++;
            r8 = r[6] & 63; if (r8 == 0) ez++;
            r9 = (r[6] >> 6 | r[7] << 2) & 63; if (r9 == 0) ez++;
            r10 = (r[7] >> 4 | r[8] << 4) & 63; if (r10 == 0) ez++;
            r11 = (r[8] >> 2) & 63; if (r11 == 0) ez++;
            r12 = r[9] & 63; if (r12 == 0) ez++;
            r13 = (r[9] >> 6 | r[10] << 2) & 63; if (r13 == 0) ez++;
            r14 = (r[10] >> 4 | r[11] << 4) & 63; if (r14 == 0) ez++;
            r15 = (r[11] >> 2) & 63; if (r15 == 0) ez++;

            /* Additional parens will allow the compiler to optimize the
             * code more with a loss of precision that is not very relevant
             * here (floating point math is not associative!). */
            E += (PE[r0] + PE[r1]) + (PE[r2] + PE[r3]) + (PE[r4] + PE[r5]) +
                 (PE[r6] + PE[r7]) + (PE[r8] + PE[r9]) + (PE[r10] + PE[r11]) +
                 (PE[r12] + PE[r13]) + (PE[r14] + PE[r15]);
            r += 12;
        }
    } else {
        for (j = 0; j < HLL_REGISTERS; j++) {
            unsigned long reg;

            HLL_DENSE_GET_REGISTER(reg,registers,j);
            if (reg == 0) {
                ez++;
                /* Increment E at the end of the loop. */
            } else {
                E += PE[reg]; /* Precomputed 2^(-reg[j]). */
            }
        }
        E += ez; /* Add 2^0 'ez' times. */
    }
    *ezp = ez;
    return E;
}

/* ================== Sparse representation implementation  ================= */

/* Convert the HLL with sparse representation given as input in its dense
 * representation. Both representations are represented by SDS strings, and
 * the input representation is freed as a side effect.
 *
 * The sparse payload is untrusted: opcodes describing more than
 * HLL_REGISTERS registers are detected before any register past the end of
 * the dense buffer is written.
 *
 * The function returns VR_OK if the sparse representation was valid (or if
 * the object was already dense). VR_ERROR is returned if the representation
 * was corrupted or the dense string could not be allocated; in that case
 * 'o' is left untouched. */
int hllSparseToDense(robj *o) {
    sds sparse = o->ptr, dense;
    struct hllhdr *hdr, *oldhdr = (struct hllhdr*)sparse;
    int idx = 0, runlen, regval;
    uint8_t *p = (uint8_t*)sparse, *end = p+sdslen(sparse);

    /* If the representation is already the right one return ASAP. */
    hdr = (struct hllhdr*) sparse;
    if (hdr->encoding == HLL_DENSE) return VR_OK;

    /* Create a string of the right size filled with zero bytes.
     * Note that the cached cardinality is set to 0 as a side effect
     * that is exactly the cardinality of an empty HLL. */
    dense = sdsnewlen(NULL,HLL_DENSE_SIZE);
    if (dense == NULL) return VR_ERROR;
    hdr = (struct hllhdr*) dense;
    *hdr = *oldhdr; /* This will copy the magic and cached cardinality. */
    hdr->encoding = HLL_DENSE;

    /* Now read the sparse representation and set non-zero registers
     * accordingly. */
    p += HLL_HDR_SIZE;
    while(p < end) {
        if (HLL_SPARSE_IS_ZERO(p)) {
            runlen = HLL_SPARSE_ZERO_LEN(p);
            idx += runlen;
            p++;
        } else if (HLL_SPARSE_IS_XZERO(p)) {
            runlen = HLL_SPARSE_XZERO_LEN(p);
            idx += runlen;
            p += 2;
        } else {
            runlen = HLL_SPARSE_VAL_LEN(p);
            regval = HLL_SPARSE_VAL_VALUE(p);
            /* A run crossing the last register would write outside of
             * the dense buffer: the input is corrupted. */
            if (runlen > HLL_REGISTERS - idx) break;
            while(runlen--) {
                HLL_DENSE_SET_REGISTER(hdr->registers,idx,regval);
                idx++;
            }
            p++;
        }
        /* Too many registers described: stop right away. This also keeps
         * 'idx' from growing without bound on a long corrupted input. */
        if (idx > HLL_REGISTERS) break;
    }

    /* If the sparse representation was valid, we expect to find idx
     * set to HLL_REGISTERS. */
    if (idx != HLL_REGISTERS) {
        sdsfree(dense);
        return VR_ERROR;
    }

    /* Free the old representation and set the new one. */
    sdsfree(o->ptr);
    o->ptr = dense;
    return VR_OK;
}

/* "Add" the element in the sparse hyperloglog data structure.
 * Actually nothing is added, but the max 0 pattern counter of the subset
 * the element belongs to is incremented if needed.
 *
 * The object 'o' is the String object holding the HLL. The function requires
 * a reference to the object in order to be able to enlarge the string if
 * needed ('o->ptr' may be reallocated by this call).
 *
 * 'ele' / 'elesize' are the bytes of the element to add.
 *
 * On success, the function returns 1 if the cardinality changed, or 0
 * if the register for this element was not updated.
 * On error (if the representation is invalid) -1 is returned.
 *
 * As a side effect the function may promote the HLL representation from
 * sparse to dense: this happens when a register requires to be set to a value
 * not representable with the sparse representation, or when the resulting
 * size would be greater than server.hll_sparse_max_bytes. */
int hllSparseAdd(robj *o, unsigned char *ele, size_t elesize) {
    struct hllhdr *hdr;
    uint8_t oldcount, count, *sparse, *end, *p, *prev, *next;
    long index, first, span;
    long is_zero = 0, is_xzero = 0, is_val = 0, runlen = 0;

    /* Update the register if this element produced a longer run of zeroes. */
    count = hllPatLen(ele,elesize,&index);

    /* If the count is too big to be representable by the sparse representation
     * switch to dense representation. */
    if (count > HLL_SPARSE_VAL_MAX_VALUE) goto promote;

    /* When updating a sparse representation, sometimes we may need to
     * enlarge the buffer for up to 3 bytes in the worst case (XZERO split
     * into XZERO-VAL-XZERO). Make sure there is enough space right now
     * so that the pointers we take during the execution of the function
     * will be valid all the time. */
    o->ptr = sdsMakeRoomFor(o->ptr,3);

    /* Step 1: we need to locate the opcode we need to modify to check
     * if a value update is actually needed. */
    sparse = p = ((uint8_t*)o->ptr) + HLL_HDR_SIZE;
    end = p + sdslen(o->ptr) - HLL_HDR_SIZE;

    first = 0;
    prev = NULL; /* Points to previous opcode at the end of the loop. */
    next = NULL; /* Points to the next opcode at the end of the loop. */
    span = 0;
    while(p < end) {
        long oplen;

        /* Set span to the number of registers covered by this opcode.
         *
         * This is the most performance critical loop of the sparse
         * representation. Sorting the conditionals from the most to the
         * least frequent opcode in many-bytes sparse HLLs is faster. */
        oplen = 1;
        if (HLL_SPARSE_IS_ZERO(p)) {
            span = HLL_SPARSE_ZERO_LEN(p);
        } else if (HLL_SPARSE_IS_VAL(p)) {
            span = HLL_SPARSE_VAL_LEN(p);
        } else { /* XZERO. */
            span = HLL_SPARSE_XZERO_LEN(p);
            oplen = 2;
        }
        /* Break if this opcode covers the register as 'index'. */
        if (index <= first+span-1) break;
        prev = p;
        p += oplen;
        first += span;
    }
    /* Invalid format: either there are no opcodes at all (span == 0), or
     * the scan consumed every opcode without finding one that covers
     * 'index' (p >= end). In the second case 'p' no longer points to a valid
     * opcode, so going on would read and write outside the sparse data. */
    if (span == 0 || p >= end) return -1;

    next = HLL_SPARSE_IS_XZERO(p) ? p+2 : p+1;
    if (next >= end) next = NULL;

    /* Cache current opcode type to avoid using the macro again and
     * again for something that will not change.
     * Also cache the run-length of the opcode. */
    if (HLL_SPARSE_IS_ZERO(p)) {
        is_zero = 1;
        runlen = HLL_SPARSE_ZERO_LEN(p);
    } else if (HLL_SPARSE_IS_XZERO(p)) {
        is_xzero = 1;
        runlen = HLL_SPARSE_XZERO_LEN(p);
    } else {
        is_val = 1;
        runlen = HLL_SPARSE_VAL_LEN(p);
    }

    /* Step 2: After the loop:
     *
     * 'first' stores the index of the first register covered
     *  by the current opcode, which is pointed by 'p'.
     *
     * 'next' and 'prev' store respectively the next and previous opcode,
     *  or NULL if the opcode at 'p' is respectively the last or first.
     *
     * 'span' is set to the number of registers covered by the current
     *  opcode.
     *
     * There are different cases in order to update the data structure
     * in place without generating it from scratch:
     *
     * A) If it is a VAL opcode already set to a value >= our 'count'
     *    no update is needed, regardless of the VAL run-length field.
     *    In this case PFADD returns 0 since no changes are performed.
     *
     * B) If it is a VAL opcode with len = 1 (representing only our
     *    register) and the value is less than 'count', we just update it
     *    since this is a trivial case. */
    if (is_val) {
        oldcount = HLL_SPARSE_VAL_VALUE(p);
        /* Case A. */
        if (oldcount >= count) return 0;

        /* Case B. */
        if (runlen == 1) {
            HLL_SPARSE_VAL_SET(p,count,1);
            goto updated;
        }
    }

    /* C) Another trivial to handle case is a ZERO opcode with a len of 1.
     * We can just replace it with a VAL opcode with our value and len of 1. */
    if (is_zero && runlen == 1) {
        HLL_SPARSE_VAL_SET(p,count,1);
        goto updated;
    }

    /* D) General case.
     *
     * The other cases are more complex: our register requires to be updated
     * and is either currently represented by a VAL opcode with len > 1,
     * by a ZERO opcode with len > 1, or by an XZERO opcode.
     *
     * In those cases the original opcode must be split into multiple
     * opcodes. The worst case is an XZERO split in the middle resulting into
     * XZERO - VAL - XZERO, so the resulting sequence max length is
     * 5 bytes.
     *
     * We perform the split writing the new sequence into the 'seq' buffer
     * with 'seqlen' as length. Later the new sequence is inserted in place
     * of the old one, possibly moving what is on the right a few bytes
     * if the new sequence is longer than the older one. */
    uint8_t seq[5], *n = seq;
    int last = first+span-1; /* Last register covered by the sequence. */
    int len;

    if (is_zero || is_xzero) {
        /* Handle splitting of ZERO / XZERO. */
        if (index != first) {
            len = index-first;
            if (len > HLL_SPARSE_ZERO_MAX_LEN) {
                HLL_SPARSE_XZERO_SET(n,len);
                n += 2;
            } else {
                HLL_SPARSE_ZERO_SET(n,len);
                n++;
            }
        }
        HLL_SPARSE_VAL_SET(n,count,1);
        n++;
        if (index != last) {
            len = last-index;
            if (len > HLL_SPARSE_ZERO_MAX_LEN) {
                HLL_SPARSE_XZERO_SET(n,len);
                n += 2;
            } else {
                HLL_SPARSE_ZERO_SET(n,len);
                n++;
            }
        }
    } else {
        /* Handle splitting of VAL. */
        int curval = HLL_SPARSE_VAL_VALUE(p);

        if (index != first) {
            len = index-first;
            HLL_SPARSE_VAL_SET(n,curval,len);
            n++;
        }
        HLL_SPARSE_VAL_SET(n,count,1);
        n++;
        if (index != last) {
            len = last-index;
            HLL_SPARSE_VAL_SET(n,curval,len);
            n++;
        }
    }

    /* Step 3: substitute the old sequence with the new one.
     *
     * Note that we already allocated space on the sds string
     * calling sdsMakeRoomFor(). Nothing has been written to the sparse
     * data yet, so jumping to 'promote' here converts the original,
     * unmodified representation. */
    int seqlen = n-seq;
    int oldlen = is_xzero ? 2 : 1;
    int deltalen = seqlen-oldlen;

    if (deltalen > 0 &&
        sdslen(o->ptr)+deltalen > server.hll_sparse_max_bytes) goto promote;
    if (deltalen && next) memmove(next+deltalen,next,end-next);
    sdsIncrLen(o->ptr,deltalen);
    memcpy(p,seq,seqlen);
    end += deltalen;

updated:
    /* Step 4: Merge adjacent values if possible.
     *
     * The representation was updated, however the resulting representation
     * may not be optimal: adjacent VAL opcodes can sometimes be merged into
     * a single one. */
    p = prev ? prev : sparse;
    int scanlen = 5; /* Scan up to 5 opcodes starting from prev. */
    while (p < end && scanlen--) {
        if (HLL_SPARSE_IS_XZERO(p)) {
            p += 2;
            continue;
        } else if (HLL_SPARSE_IS_ZERO(p)) {
            p++;
            continue;
        }
        /* We need two adjacent VAL opcodes to try a merge, having
         * the same value, and a len that fits the VAL opcode max len. */
        if (p+1 < end && HLL_SPARSE_IS_VAL(p+1)) {
            int v1 = HLL_SPARSE_VAL_VALUE(p);
            int v2 = HLL_SPARSE_VAL_VALUE(p+1);
            if (v1 == v2) {
                int len = HLL_SPARSE_VAL_LEN(p)+HLL_SPARSE_VAL_LEN(p+1);
                if (len <= HLL_SPARSE_VAL_MAX_LEN) {
                    HLL_SPARSE_VAL_SET(p+1,v1,len);
                    memmove(p,p+1,end-p);
                    sdsIncrLen(o->ptr,-1);
                    end--;
                    /* After a merge we reiterate without incrementing 'p'
                     * in order to try to merge the just merged value with
                     * a value on its right. */
                    continue;
                }
            }
        }
        p++;
    }

    /* Invalidate the cached cardinality. */
    hdr = o->ptr;
    HLL_INVALIDATE_CACHE(hdr);
    return 1;

promote: /* Promote to dense representation. */
    if (hllSparseToDense(o) == VR_ERROR) return -1; /* Corrupted HLL. */
    hdr = o->ptr;

    /* We need to call hllDenseAdd() to perform the operation after the
     * conversion. However the result must be 1, since if we need to
     * convert from sparse to dense a register requires to be updated.
     *
     * Note that this in turn means that PFADD will make sure the command
     * is propagated to slaves / AOF, so if there is a sparse -> dense
     * conversion, it will be performed in all the slaves as well. */
    int dense_retval = hllDenseAdd(hdr->registers, ele, elesize);
    ASSERT(dense_retval == 1);
    return dense_retval;
}

/* Compute SUM(2^-reg) over a sparse encoded register set.
 *
 * 'sparse' points to the first opcode and 'sparselen' is the number of
 * opcode bytes. 'PE' is a precomputed table of 2^-reg values indexed by reg.
 *
 * The number of zero registers is stored into '*ezp'. When the opcodes do
 * not describe exactly HLL_REGISTERS registers and 'invalid' is not NULL,
 * '*invalid' is set to 1 (it is never cleared here). */
double hllSparseSum(uint8_t *sparse, int sparselen, double *PE, int *ezp, int *invalid) {
    uint8_t *cur = sparse;
    uint8_t *stop = sparse+sparselen;
    double sum = 0;
    int zeros = 0, covered = 0;

    while (cur < stop) {
        int span;

        if (HLL_SPARSE_IS_ZERO(cur)) {
            /* Short run of zero registers: accounted for after the loop. */
            span = HLL_SPARSE_ZERO_LEN(cur);
            zeros += span;
            cur += 1;
        } else if (HLL_SPARSE_IS_XZERO(cur)) {
            /* Long (two bytes) run of zero registers. */
            span = HLL_SPARSE_XZERO_LEN(cur);
            zeros += span;
            cur += 2;
        } else {
            /* Run of registers all set to the same non-zero value. */
            int value = HLL_SPARSE_VAL_VALUE(cur);

            span = HLL_SPARSE_VAL_LEN(cur);
            sum += PE[value]*span;
            cur += 1;
        }
        covered += span;
    }

    if (invalid && covered != HLL_REGISTERS) *invalid = 1;

    sum += zeros; /* Each zero register contributes 2^0. */
    *ezp = zeros;
    return sum;
}

/* ========================= HyperLogLog Count ==============================
 * This is the core of the algorithm where the approximated count is computed.
 * The function uses the lower level hllDenseSum() and hllSparseSum() functions
 * as helpers to compute the SUM(2^-reg) part of the computation, which is
 * representation-specific, while all the rest is common. */

/* Implements the SUM operation for uint8_t data type which is only used
 * internally as speedup for PFCOUNT with multiple keys.
 *
 * 'registers' is an array of HLL_REGISTERS bytes, one register per byte.
 * 'PE' is the precomputed table of 2^-reg values indexed by reg.
 * The number of zero registers is stored into '*ezp' and SUM(2^-reg) is
 * returned.
 *
 * Registers are examined eight at a time. The 8 byte group is loaded with
 * memcpy() instead of dereferencing a casted uint64_t pointer: 'registers'
 * is a plain byte array with no alignment guarantee, so the cast would be
 * both a strict aliasing violation and a potentially misaligned access. */
double hllRawSum(uint8_t *registers, double *PE, int *ezp) {
    double E = 0;
    int j, ez = 0;
    uint8_t *bytes = registers;

    for (j = 0; j < HLL_REGISTERS/8; j++) {
        uint64_t word;

        memcpy(&word,bytes,sizeof(word));
        if (word == 0) {
            /* Fast path: all the eight registers are zero. */
            ez += 8;
        } else {
            if (bytes[0]) E += PE[bytes[0]]; else ez++;
            if (bytes[1]) E += PE[bytes[1]]; else ez++;
            if (bytes[2]) E += PE[bytes[2]]; else ez++;
            if (bytes[3]) E += PE[bytes[3]]; else ez++;
            if (bytes[4]) E += PE[bytes[4]]; else ez++;
            if (bytes[5]) E += PE[bytes[5]]; else ez++;
            if (bytes[6]) E += PE[bytes[6]]; else ez++;
            if (bytes[7]) E += PE[bytes[7]]; else ez++;
        }
        bytes += 8;
    }
    E += ez; /* 2^(-reg[j]) is 1 when m is 0, add it 'ez' times for every
                zero register in the HLL. */
    *ezp = ez;
    return E;
}

/* Return the approximated cardinality of the set, computed from the
 * harmonic mean of the register values. 'hdr' points to the start of the
 * SDS string holding the HLL representation.
 *
 * If the HLL is sparse and its representation is not valid, the integer
 * pointed by 'invalid' is set to non-zero, otherwise it is left untouched.
 * 'invalid' may be NULL.
 *
 * Besides HLL_DENSE and HLL_SPARSE the function understands the special
 * internal-only HLL_RAW encoding, where hdr->registers is an array of
 * HLL_REGISTERS uint8_t elements: this is what multi-key PFCOUNT uses to
 * avoid working with packed 6-bit registers. */
static uint64_t hllCount(struct hllhdr *hdr, int *invalid) {
    /* Table of 2^(-k), filled on the first call, used to speed up the
     * computation of SUM(2^-register[0..i]). */
    static double PE[64];
    static int initialized = 0;

    double m = HLL_REGISTERS;
    double alpha = 0.7213/(1+1.079/m);
    double E;
    int ez; /* Number of registers equal to 0. */

    if (!initialized) {
        int k;

        PE[0] = 1; /* 2^(-reg[j]) is 1 when the register is 0. */
        for (k = 1; k < 64; k++) {
            /* 2^(-k) is the same as 1/2^k. */
            PE[k] = 1.0/(1ULL << k);
        }
        initialized = 1;
    }

    /* Compute SUM(2^-register[0..i]) with the helper matching the
     * encoding. */
    if (hdr->encoding == HLL_DENSE) {
        E = hllDenseSum(hdr->registers,PE,&ez);
    } else if (hdr->encoding == HLL_SPARSE) {
        E = hllSparseSum(hdr->registers,
                         sdslen((sds)hdr)-HLL_HDR_SIZE,PE,&ez,invalid);
    } else if (hdr->encoding == HLL_RAW) {
        E = hllRawSum(hdr->registers,PE,&ez);
    } else {
        serverPanic("Unknown HyperLogLog encoding in hllCount()");
    }

    /* Raw estimate: alpha_m * m^2 times the inverse of the sum. */
    E = (1/E)*alpha*m*m;

    if (E < m*2.5 && ez != 0) {
        /* Small cardinalities: use LINEARCOUNTING. */
        E = m*log(m/ez);
    } else if (m == 16384 && E < 72000) {
        /* Up to 72000 the raw HyperLogLog estimate is used, but it shows a
         * strong bias in the range 2.5*16384 - 72000. The bias was modeled
         * with a polynomial regression; the correction is only applied for
         * P=14, the value it was verified with. */
        double bias = 5.9119*1.0e-18*(E*E*E*E)
                      -1.4253*1.0e-12*(E*E*E)+
                      1.2940*1.0e-7*(E*E)
                      -5.2921*1.0e-3*E+
                      83.3216;

        E -= E*(bias/100);
    }

    /* No correction is applied for E > 1/30 of 2^32 since a 64 bit hash
     * function and 6 bit counters are used. Applying it for 1/30 of 2^64 is
     * not needed: it would require a huge set to approach such a value. */
    return (uint64_t) E;
}

/* Add 'ele' (of 'elesize' bytes) to the HLL stored in 'o', dispatching to
 * hllDenseAdd() or hllSparseAdd() according to the encoding found in the
 * header. Returns whatever the selected function returns, or -1 if the
 * encoding is neither dense nor sparse. */
int hllAdd(robj *o, unsigned char *ele, size_t elesize) {
    struct hllhdr *hdr = o->ptr;

    if (hdr->encoding == HLL_DENSE)
        return hllDenseAdd(hdr->registers,ele,elesize);
    if (hdr->encoding == HLL_SPARSE)
        return hllSparseAdd(o,ele,elesize);

    return -1; /* Invalid representation. */
}

/* Merge by computing MAX(registers[i],hll[i]) the HyperLogLog 'hll'
 * with an array of uint8_t HLL_REGISTERS registers pointed by 'max'.
 *
 * The hll object must be already validated via isHLLObjectOrReply()
 * or in some other way.
 *
 * If the HyperLogLog is sparse and is found to be invalid, VR_ERROR
 * is returned, otherwise the function always succeeds. Note that when
 * VR_ERROR is returned 'max' may have been partially updated with the
 * registers decoded before the corruption was detected. */
int hllMerge(uint8_t *max, robj *hll) {
    struct hllhdr *hdr = hll->ptr;
    int i;

    if (hdr->encoding == HLL_DENSE) {
        uint8_t val;

        for (i = 0; i < HLL_REGISTERS; i++) {
            HLL_DENSE_GET_REGISTER(val,hdr->registers,i);
            if (val > max[i]) max[i] = val;
        }
    } else {
        uint8_t *p = hll->ptr, *end = p + sdslen(hll->ptr);
        long runlen, regval;

        /* Every run is checked against the registers still available
         * before being consumed: a corrupted payload could otherwise make
         * the VAL loop access 'max' past its HLL_REGISTERS elements. The
         * check also keeps 'i' <= HLL_REGISTERS so it cannot overflow. */
        p += HLL_HDR_SIZE;
        i = 0;
        while(p < end) {
            if (HLL_SPARSE_IS_ZERO(p)) {
                runlen = HLL_SPARSE_ZERO_LEN(p);
                if (runlen > HLL_REGISTERS-i) return VR_ERROR;
                i += runlen;
                p++;
            } else if (HLL_SPARSE_IS_XZERO(p)) {
                runlen = HLL_SPARSE_XZERO_LEN(p);
                if (runlen > HLL_REGISTERS-i) return VR_ERROR;
                i += runlen;
                p += 2;
            } else {
                runlen = HLL_SPARSE_VAL_LEN(p);
                regval = HLL_SPARSE_VAL_VALUE(p);
                if (runlen > HLL_REGISTERS-i) return VR_ERROR;
                while(runlen--) {
                    if (regval > max[i]) max[i] = regval;
                    i++;
                }
                p++;
            }
        }
        if (i != HLL_REGISTERS) return VR_ERROR;
    }
    return VR_OK;
}

/* ========================== HyperLogLog commands ========================== */

/* Create a new, empty HLL object.
 *
 * The object is always created with the sparse encoding: the payload is
 * just the sequence of XZERO opcodes needed to cover all the
 * HLL_REGISTERS registers. It gets upgraded to the dense representation
 * later, as needed. */
robj *createHLLObject(void) {
    robj *o;
    struct hllhdr *hdr;
    sds s;
    uint8_t *op;
    int remaining;
    int sparselen = HLL_HDR_SIZE +
                    (((HLL_REGISTERS+(HLL_SPARSE_XZERO_MAX_LEN-1)) /
                     HLL_SPARSE_XZERO_MAX_LEN)*2);

    /* sdsnewlen() with a NULL init pointer is expected to hand back a
     * zero filled buffer; the opcodes are written right after the header. */
    s = sdsnewlen(NULL,sparselen);
    op = (uint8_t*)s + HLL_HDR_SIZE;

    /* Emit XZERO opcodes, each one covering as many registers as it can,
     * until no register is left uncovered. */
    remaining = HLL_REGISTERS;
    while (remaining != 0) {
        int chunk = HLL_SPARSE_XZERO_MAX_LEN;

        if (chunk > remaining) chunk = remaining;
        HLL_SPARSE_XZERO_SET(op,chunk);
        op += 2;
        remaining -= chunk;
    }
    ASSERT((op-(uint8_t*)s) == sparselen);

    /* Wrap the string into an object and fill the header in. */
    o = createObject(OBJ_STRING,s);
    hdr = o->ptr;
    memcpy(hdr->magic,"HYLL",4);
    hdr->encoding = HLL_SPARSE;
    return o;
}

/* Check if the object is a String with a valid HLL representation.
 * Return VR_OK if this is true, otherwise reply to the client
 * with an error and return VR_ERROR.
 *
 * The checks performed are: the object is a string, it is sds encoded,
 * it is at least as long as the HLL header, the magic is "HYLL", the
 * encoding is a known one and, for dense HLLs, the length is exactly
 * HLL_DENSE_SIZE. The sparse payload itself is NOT validated here. */
int isHLLObjectOrReply(client *c, robj *o) {
    struct hllhdr *hdr;

    /* Key exists, check type */
    if (checkType(c,o,OBJ_STRING))
        return VR_ERROR; /* Error already sent. */

    /* The header is read through o->ptr, which is only a byte buffer when
     * the string is sds encoded. An integer encoded string (presumably
     * storing the number itself in o->ptr, as in Redis) that is long enough
     * to pass the length test below must be rejected before o->ptr is
     * dereferenced. */
    if (!sdsEncodedObject(o)) goto invalid;

    if (stringObjectLen(o) < sizeof(*hdr)) goto invalid;
    hdr = o->ptr;

    /* Magic should be "HYLL". */
    if (hdr->magic[0] != 'H' || hdr->magic[1] != 'Y' ||
        hdr->magic[2] != 'L' || hdr->magic[3] != 'L') goto invalid;

    if (hdr->encoding > HLL_MAX_ENCODING) goto invalid;

    /* Dense representation string length should match exactly. */
    if (hdr->encoding == HLL_DENSE &&
        stringObjectLen(o) != HLL_DENSE_SIZE) goto invalid;

    /* All tests passed. */
    return VR_OK;

invalid:
    addReplySds(c,
        sdsnew("-WRONGTYPE Key is not a valid "
               "HyperLogLog string value.\r\n"));
    return VR_ERROR;
}

/* PFADD var ele ele ele ... ele => :0 or :1
 *
 * Adds every element to the HLL stored at 'var', creating the key when it
 * does not exist. Replies 1 if the key was created or at least one register
 * changed, 0 otherwise. The whole operation runs holding the write lock of
 * the DB selected by the key. */
void pfaddCommand(client *c) {
    robj *o;
    struct hllhdr *hdr;
    int changes = 0;
    int expired = 0;
    int arg;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);
    o = lookupKeyWrite(c->db,c->argv[1],&expired);
    if (o != NULL) {
        /* Existing key: it must hold an HLL, and we need a private copy
         * of the value before modifying it. */
        if (isHLLObjectOrReply(c,o) != VR_OK) {
            unlockDb(c->db);
            if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
            return;
        }
        o = dbUnshareStringValue(c->db,c->argv[1],o);
    } else {
        /* Missing key: create an empty HLL. The creation alone counts
         * as a modification. */
        o = createHLLObject();
        dbAdd(c->db,c->argv[1],o);
        changes++;
    }

    /* Perform the low level ADD operation for every element. */
    for (arg = 2; arg < c->argc; arg++) {
        int rc = hllAdd(o, (unsigned char*)c->argv[arg]->ptr,
                           sdslen(c->argv[arg]->ptr));

        if (rc == -1) {
            /* Corrupted HLL: stop here and report the error. */
            unlockDb(c->db);
            if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
            addReplySds(c,sdsnew(invalid_hll_err));
            return;
        }
        if (rc == 1) changes++;
    }

    hdr = o->ptr;
    if (changes) {
        signalModifiedKey(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_STRING,"pfadd",c->argv[1],c->db->id);
        c->vel->dirty++;
        HLL_INVALIDATE_CACHE(hdr);
    }
    addReply(c, changes ? shared.cone : shared.czero);
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* PFCOUNT var [var ...] -> approximated cardinality of set.
 *
 * With a single key the cardinality of that HLL is returned, using the
 * value cached in the header when it is still valid and refreshing the
 * cache otherwise. With multiple keys the cardinality of the union of the
 * HLLs is returned; nothing is cached in that case. */
void pfcountCommand(client *c) {
    robj *o;
    struct hllhdr *hdr;
    uint64_t card;
    /* Initialized to 0, as pfaddCommand() does, so that the tests on
     * 'expired' below read a defined value even if lookupKeyWrite() leaves
     * it untouched when nothing expired. */
    int expired = 0;

    /* Case 1: multi-key keys, cardinality of the union.
     *
     * When multiple keys are specified, PFCOUNT actually computes
     * the cardinality of the merge of the N HLLs specified. */
    if (c->argc > 2) {
        uint8_t max[HLL_HDR_SIZE+HLL_REGISTERS], *registers;
        int j;

        /* Compute an HLL with M[i] = MAX(M[i]_j). */
        memset(max,0,sizeof(max));
        hdr = (struct hllhdr*) max;
        hdr->encoding = HLL_RAW; /* Special internal-only encoding. */
        registers = max + HLL_HDR_SIZE;
        for (j = 1; j < c->argc; j++) {
            robj *hll;

            /* Each key is looked up holding the read lock of its own DB,
             * which is released before moving to the next key. */
            fetchInternalDbByKey(c,c->argv[j]);
            lockDbRead(c->db);
            hll = lookupKeyRead(c->db,c->argv[j]);
            if (hll == NULL) {
                unlockDb(c->db);
                continue; /* Assume empty HLL for non existing var.*/
            }
            /* Check type and size. */
            if (isHLLObjectOrReply(c,hll) != VR_OK) {
                unlockDb(c->db);
                return;
            }
            /* Merge with this HLL with our 'max' HLL by setting max[i]
             * to MAX(max[i],hll[i]). */
            if (hllMerge(registers,hll) == VR_ERROR) {
                unlockDb(c->db);
                addReplySds(c,sdsnew(invalid_hll_err));
                return;
            }

            unlockDb(c->db);
        }

        /* Compute cardinality of the resulting set. */
        addReplyLongLong(c,hllCount(hdr,NULL));
        return;
    }

    /* Case 2: cardinality of the single HLL.
     *
     * The user specified a single key. Either return the cached value
     * or compute one and update the cache. */
    fetchInternalDbByKey(c,c->argv[1]);
    lockDbWrite(c->db);
    o = lookupKeyWrite(c->db,c->argv[1],&expired);
    if (o == NULL) {
        /* No key? Cardinality is zero since no element was added, otherwise
         * we would have a key as PFADD creates it as a side effect. */
        addReply(c,shared.czero);
    } else {
        if (isHLLObjectOrReply(c,o) != VR_OK) {
            unlockDb(c->db);
            if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
            return;
        }
        o = dbUnshareStringValue(c->db,c->argv[1],o);

        /* Check if the cached cardinality is valid. */
        hdr = o->ptr;
        if (HLL_VALID_CACHE(hdr)) {
            /* Just return the cached value, stored in the header as a
             * little endian 64 bit integer. */
            card = (uint64_t)hdr->card[0];
            card |= (uint64_t)hdr->card[1] << 8;
            card |= (uint64_t)hdr->card[2] << 16;
            card |= (uint64_t)hdr->card[3] << 24;
            card |= (uint64_t)hdr->card[4] << 32;
            card |= (uint64_t)hdr->card[5] << 40;
            card |= (uint64_t)hdr->card[6] << 48;
            card |= (uint64_t)hdr->card[7] << 56;
        } else {
            int invalid = 0;
            /* Recompute it and update the cached value. */
            card = hllCount(hdr,&invalid);
            if (invalid) {
                unlockDb(c->db);
                if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
                addReplySds(c,sdsnew(invalid_hll_err));
                return;
            }
            hdr->card[0] = card & 0xff;
            hdr->card[1] = (card >> 8) & 0xff;
            hdr->card[2] = (card >> 16) & 0xff;
            hdr->card[3] = (card >> 24) & 0xff;
            hdr->card[4] = (card >> 32) & 0xff;
            hdr->card[5] = (card >> 40) & 0xff;
            hdr->card[6] = (card >> 48) & 0xff;
            hdr->card[7] = (card >> 56) & 0xff;
            /* This is not considered a read-only command even if the
             * data structure is not modified, since the cached value
             * may be modified and given that the HLL is a string
             * we need to propagate the change. */
            signalModifiedKey(c->db,c->argv[1]);
            server.dirty++;
            c->vel->dirty++;
        }
        addReplyLongLong(c,card);
    }

    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* PFMERGE dest src1 src2 src3 ... srcN => OK
 *
 * Stores into 'dest' the union of the HLLs found at 'dest' itself (when it
 * exists) and at every source key. The destination is always written with
 * the dense encoding.
 *
 * NOTE(review): unlike PFADD / PFCOUNT this command neither calls
 * fetchInternalDbByKey() nor takes the DB lock, and it bumps server.dirty
 * rather than c->vel->dirty -- confirm whether this is intentional. */
void pfmergeCommand(client *c) {
    uint8_t merged[HLL_REGISTERS];
    struct hllhdr *hdr;
    robj *dst;
    int j;

    /* Step 1: compute M[i] = MAX(M[i]_j) into a plain array of registers.
     * The loop starts from argv[1], so an already existing destination
     * takes part in the merge. The result is written to the target key
     * later. */
    memset(merged,0,sizeof(merged));
    for (j = 1; j < c->argc; j++) {
        robj *src = lookupKeyRead(c->db,c->argv[j]);

        /* A missing key is handled as an empty HLL. */
        if (src == NULL) continue;

        /* Check type and size. */
        if (isHLLObjectOrReply(c,src) != VR_OK) return;

        /* merged[i] = MAX(merged[i],src[i]). */
        if (hllMerge(merged,src) == VR_ERROR) {
            addReplySds(c,sdsnew(invalid_hll_err));
            return;
        }
    }

    /* Step 2: create / unshare the destination key's value if needed. */
    dst = lookupKeyWrite(c->db,c->argv[1],NULL);
    if (dst != NULL) {
        /* The key exists: its type/size was already checked while
         * merging, so it is not checked again. */
        dst = dbUnshareStringValue(c->db,c->argv[1],dst);
    } else {
        /* The key does not exist: start from an empty HLL. */
        dst = createHLLObject();
        dbAdd(c->db,c->argv[1],dst);
    }

    /* Only dense objects are supported as destination. */
    if (hllSparseToDense(dst) == VR_ERROR) {
        addReplySds(c,sdsnew(invalid_hll_err));
        return;
    }

    /* Step 3: write the merged registers into the destination and
     * invalidate its cached cardinality. */
    hdr = dst->ptr;
    for (j = 0; j < HLL_REGISTERS; j++) {
        HLL_DENSE_SET_REGISTER(hdr->registers,j,merged[j]);
    }
    HLL_INVALIDATE_CACHE(hdr);

    signalModifiedKey(c->db,c->argv[1]);
    /* A "pfadd" event is generated for PFMERGE for semantic simplicity,
     * since in theory this is a mass-add of elements. */
    notifyKeyspaceEvent(NOTIFY_STRING,"pfadd",c->argv[1],c->db->id);
    server.dirty++;
    addReply(c,shared.ok);
}

/* ========================== Testing / Debugging  ========================== */

/* PFSELFTEST
 * This command performs a self-test of the HLL registers implementation,
 * something that is not easy to test from the outside.
 *
 * Two tests are run: a register access test on a dense buffer, and an
 * approximation error test that feeds the same elements to a dense and a
 * sparse HLL. The reply is OK on success, or a TESTFAILED error describing
 * the first failed check. */
#define HLL_TEST_CYCLES 1000
void pfselftestCommand(client *c) {
    unsigned int j, i;
    sds bitcounters = sdsnewlen(NULL,HLL_DENSE_SIZE);
    struct hllhdr *hdr = (struct hllhdr*) bitcounters, *hdr2;
    robj *o = NULL; /* Sparse HLL used by test 2, released in cleanup. */
    uint8_t bytecounters[HLL_REGISTERS];

    /* Test 1: access registers.
     * The test is conceived to test that the different counters of our data
     * structure are accessible and that setting their values both result in
     * the correct value to be retained and not affect adjacent values. */
    for (j = 0; j < HLL_TEST_CYCLES; j++) {
        /* Set the HLL counters and an array of unsigned bytes of the
         * same size to the same set of random values. */
        for (i = 0; i < HLL_REGISTERS; i++) {
            unsigned int r = rand() & HLL_REGISTER_MAX;

            bytecounters[i] = r;
            HLL_DENSE_SET_REGISTER(hdr->registers,i,r);
        }
        /* Check that we are able to retrieve the same values. */
        for (i = 0; i < HLL_REGISTERS; i++) {
            unsigned int val;

            HLL_DENSE_GET_REGISTER(val,hdr->registers,i);
            if (val != bytecounters[i]) {
                addReplyErrorFormat(c,
                    "TESTFAILED Register %d should be %d but is %d",
                    i, (int) bytecounters[i], (int) val);
                goto cleanup;
            }
        }
    }

    /* Test 2: approximation error.
     * The test adds unique elements and checks that the estimated value
     * is always within reasonable bounds.
     *
     * We check that the error is smaller than a few times the expected
     * standard error, to make it very unlikely for the test to fail because
     * of a "bad" run.
     *
     * The test is performed with both dense and sparse HLLs at the same
     * time also verifying that the computed cardinality is the same. */
    memset(hdr->registers,0,HLL_DENSE_SIZE-HLL_HDR_SIZE);
    o = createHLLObject();
    double relerr = 1.04/sqrt(HLL_REGISTERS);
    /* Next cardinality at which the checks run: 1, 10, 100, ... */
    int64_t checkpoint = 1;
    uint64_t seed = (uint64_t)rand() | (uint64_t)rand() << 32;
    uint64_t ele;
    for (j = 1; j <= 10000000; j++) {
        /* XOR-ing the counter with a fixed seed yields distinct elements. */
        ele = j ^ seed;
        hllDenseAdd(hdr->registers,(unsigned char*)&ele,sizeof(ele));
        hllAdd(o,(unsigned char*)&ele,sizeof(ele));

        /* Make sure that for small cardinalities we use sparse
         * encoding. */
        if (j == checkpoint && j < server.hll_sparse_max_bytes/2) {
            hdr2 = o->ptr;
            if (hdr2->encoding != HLL_SPARSE) {
                addReplyError(c, "TESTFAILED sparse encoding not used");
                goto cleanup;
            }
        }

        /* Check that dense and sparse representations agree. */
        if (j == checkpoint && hllCount(hdr,NULL) != hllCount(o->ptr,NULL)) {
                addReplyError(c, "TESTFAILED dense/sparse disagree");
                goto cleanup;
        }

        /* Check error. */
        if (j == checkpoint) {
            int64_t abserr = checkpoint - (int64_t)hllCount(hdr,NULL);
            /* Tolerate up to 6 times the expected standard error. */
            uint64_t maxerr = ceil(relerr*6*checkpoint);

            /* Adjust the max error we expect for cardinality 10
             * since from time to time it is statistically likely to get
             * much higher error due to collision, resulting into a false
             * positive. */
            if (j == 10) maxerr = 1;

            if (abserr < 0) abserr = -abserr;
            if (abserr > (int64_t)maxerr) {
                addReplyErrorFormat(c,
                    "TESTFAILED Too big error. card:%llu abserr:%llu",
                    (unsigned long long) checkpoint,
                    (unsigned long long) abserr);
                goto cleanup;
            }
            checkpoint *= 10;
        }
    }

    /* Success! */
    addReply(c,shared.ok);

cleanup:
    /* Reached both on success and on failure: release the dense buffer
     * and, if it was created, the sparse HLL object. */
    sdsfree(bitcounters);
    if (o) decrRefCount(o);
}

/* PFDEBUG <subcommand> <key> ... args ...
 * Different debugging related operations about the HLL implementation.
 *
 * The key must exist and hold a valid HLL object, otherwise an error is
 * replied. Every subcommand below takes exactly the key as argument:
 *
 *   GETREG   - reply with the HLL_REGISTERS register values; a sparse
 *              object is converted to dense first.
 *   DECODE   - reply with a textual dump of the sparse opcodes
 *              ("z:<len>", "Z:<len>", "v:<val>,<len>"); only valid for the
 *              sparse encoding.
 *   ENCODING - reply with the status "dense" or "sparse".
 *   TODENSE  - convert a sparse object to dense; reply 1 if a conversion
 *              happened, 0 otherwise. */
void pfdebugCommand(client *c) {
    char *cmd = c->argv[1]->ptr;
    struct hllhdr *hdr;
    robj *o;
    int j;

    o = lookupKeyWrite(c->db,c->argv[2],NULL);
    if (o == NULL) {
        addReplyError(c,"The specified key does not exist");
        return;
    }
    if (isHLLObjectOrReply(c,o) != VR_OK) return;
    o = dbUnshareStringValue(c->db,c->argv[2],o);
    hdr = o->ptr;

    /* PFDEBUG GETREG <key> */
    if (!strcasecmp(cmd,"getreg")) {
        if (c->argc != 3) goto arityerr;

        if (hdr->encoding == HLL_SPARSE) {
            if (hllSparseToDense(o) == VR_ERROR) {
                addReplySds(c,sdsnew(invalid_hll_err));
                return;
            }
            server.dirty++; /* Force propagation on encoding change. */
        }

        /* Reload the header: the conversion may have replaced o->ptr. */
        hdr = o->ptr;
        addReplyMultiBulkLen(c,HLL_REGISTERS);
        for (j = 0; j < HLL_REGISTERS; j++) {
            uint8_t val;

            HLL_DENSE_GET_REGISTER(val,hdr->registers,j);
            addReplyLongLong(c,val);
        }
    }
    /* PFDEBUG DECODE <key> */
    else if (!strcasecmp(cmd,"decode")) {
        if (c->argc != 3) goto arityerr;

        uint8_t *p = o->ptr, *end = p+sdslen(o->ptr);
        sds decoded;

        if (hdr->encoding != HLL_SPARSE) {
            addReplyError(c,"HLL encoding is not sparse");
            return;
        }

        /* Allocate the output buffer only after the encoding check, so the
         * early return above cannot leak it. */
        decoded = sdsempty();

        p += HLL_HDR_SIZE;
        while(p < end) {
            int runlen, regval;

            if (HLL_SPARSE_IS_ZERO(p)) {
                runlen = HLL_SPARSE_ZERO_LEN(p);
                p++;
                decoded = sdscatprintf(decoded,"z:%d ",runlen);
            } else if (HLL_SPARSE_IS_XZERO(p)) {
                runlen = HLL_SPARSE_XZERO_LEN(p);
                p += 2;
                decoded = sdscatprintf(decoded,"Z:%d ",runlen);
            } else {
                runlen = HLL_SPARSE_VAL_LEN(p);
                regval = HLL_SPARSE_VAL_VALUE(p);
                p++;
                decoded = sdscatprintf(decoded,"v:%d,%d ",regval,runlen);
            }
        }
        decoded = sdstrim(decoded," ");
        addReplyBulkCBuffer(c,decoded,sdslen(decoded));
        sdsfree(decoded);
    }
    /* PFDEBUG ENCODING <key> */
    else if (!strcasecmp(cmd,"encoding")) {
        char *encodingstr[2] = {"dense","sparse"};
        if (c->argc != 3) goto arityerr;

        addReplyStatus(c,encodingstr[hdr->encoding]);
    }
    /* PFDEBUG TODENSE <key> */
    else if (!strcasecmp(cmd,"todense")) {
        int conv = 0;
        if (c->argc != 3) goto arityerr;

        if (hdr->encoding == HLL_SPARSE) {
            if (hllSparseToDense(o) == VR_ERROR) {
                addReplySds(c,sdsnew(invalid_hll_err));
                return;
            }
            conv = 1;
            server.dirty++; /* Force propagation on encoding change. */
        }
        addReply(c,conv ? shared.cone : shared.czero);
    } else {
        addReplyErrorFormat(c,"Unknown PFDEBUG subcommand '%s'", cmd);
    }
    return;

arityerr:
    addReplyErrorFormat(c,
        "Wrong number of arguments for the '%s' subcommand",cmd);
}


================================================
FILE: src/vr_hyperloglog.h
================================================
#ifndef _VR_HYPERLOGLOG_H_
#define _VR_HYPERLOGLOG_H_

/* Prototypes exported by the HyperLogLog (HLL) implementation in
 * vr_hyperloglog.c. The robj and client types are declared elsewhere in the
 * project. */

/* Hashing and low level register helpers. */
uint64_t MurmurHash64A (const void * key, int len, unsigned int seed);
int hllPatLen(unsigned char *ele, size_t elesize, long *regp);

/* Operations on the dense and sparse representations, and on raw register
 * arrays. */
int hllDenseAdd(uint8_t *registers, unsigned char *ele, size_t elesize);
double hllDenseSum(uint8_t *registers, double *PE, int *ezp);
int hllSparseToDense(robj *o);
int hllSparseAdd(robj *o, unsigned char *ele, size_t elesize);
double hllSparseSum(uint8_t *sparse, int sparselen, double *PE, int *ezp, int *invalid);
double hllRawSum(uint8_t *registers, double *PE, int *ezp);

/* Operations on HLL objects regardless of their current encoding. */
int hllAdd(robj *o, unsigned char *ele, size_t elesize);
int hllMerge(uint8_t *max, robj *hll);
robj *createHLLObject(void);
int isHLLObjectOrReply(struct client *c, robj *o);

/* Client command entry points. */
void pfaddCommand(struct client *c);
void pfcountCommand(struct client *c);
void pfmergeCommand(struct client *c);
void pfselftestCommand(struct client *c);
void pfdebugCommand(struct client *c);

#endif


================================================
FILE: src/vr_intset.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <string.h>

#include <vr_core.h>

/* Element encodings. Each constant is the byte width of one stored element,
 * so the values are naturally ordered:
 * INTSET_ENC_INT16 < INTSET_ENC_INT32 < INTSET_ENC_INT64. */
#define INTSET_ENC_INT16 (sizeof(int16_t))
#define INTSET_ENC_INT32 (sizeof(int32_t))
#define INTSET_ENC_INT64 (sizeof(int64_t))

/* Pick the narrowest encoding able to represent v. */
static uint8_t _intsetValueEncoding(int64_t v) {
    if (v >= INT16_MIN && v <= INT16_MAX)
        return INTSET_ENC_INT16;
    if (v >= INT32_MIN && v <= INT32_MAX)
        return INTSET_ENC_INT32;
    return INTSET_ENC_INT64;
}

/* Read element number pos from is->contents, treating the array as if its
 * elements had the width given by enc (which may differ from the encoding
 * currently recorded in the header). */
static int64_t _intsetGetEncoded(intset *is, int pos, uint8_t enc) {
    if (enc == INTSET_ENC_INT64) {
        int64_t wide;
        memcpy(&wide,&((int64_t*)is->contents)[pos],sizeof(wide));
        memrev64ifbe(&wide);
        return wide;
    }

    if (enc == INTSET_ENC_INT32) {
        int32_t medium;
        memcpy(&medium,&((int32_t*)is->contents)[pos],sizeof(medium));
        memrev32ifbe(&medium);
        return medium;
    }

    /* Anything else is read as 16 bit. */
    int16_t narrow;
    memcpy(&narrow,&((int16_t*)is->contents)[pos],sizeof(narrow));
    memrev16ifbe(&narrow);
    return narrow;
}

/* Read element number pos using the encoding recorded in the header. */
static int64_t _intsetGet(intset *is, int pos) {
    uint8_t enc = intrev32ifbe(is->encoding);

    return _intsetGetEncoded(is,pos,enc);
}

/* Store value into slot number pos, using the encoding recorded in the
 * header. The value is truncated to the slot width by the assignment. */
static void _intsetSet(intset *is, int pos, int64_t value) {
    switch (intrev32ifbe(is->encoding)) {
    case INTSET_ENC_INT64: {
        int64_t *slot = (int64_t*)is->contents + pos;
        *slot = value;
        memrev64ifbe(slot);
        break;
    }
    case INTSET_ENC_INT32: {
        int32_t *slot = (int32_t*)is->contents + pos;
        *slot = value;
        memrev32ifbe(slot);
        break;
    }
    default: {
        /* Every other encoding value is handled as 16 bit. */
        int16_t *slot = (int16_t*)is->contents + pos;
        *slot = value;
        memrev16ifbe(slot);
        break;
    }
    }
}

/* Allocate a header-only intset: zero elements, 16 bit encoding. */
intset *intsetNew(void) {
    intset *fresh = dalloc(sizeof(intset));

    fresh->length = 0;
    fresh->encoding = intrev32ifbe(INTSET_ENC_INT16);
    return fresh;
}

/* Resize the intset so that it can hold len elements of the encoding
 * currently recorded in the header. Returns the (possibly moved) intset;
 * the caller must use the returned pointer from now on.
 *
 * The payload size is computed as size_t rather than uint32_t: with a 32 bit
 * product, len * encoding wraps for large sets (e.g. 2^29 elements of 8
 * bytes) and the buffer would be allocated too small. */
static intset *intsetResize(intset *is, uint32_t len) {
    size_t size = (size_t)len*intrev32ifbe(is->encoding);
    is = drealloc(is,sizeof(intset)+size);
    return is;
}

/* Binary search for "value" in the sorted element array.
 *
 * Returns 1 and stores the index of the element in *pos when the value is
 * present. Returns 0 and stores the index at which the value would have to
 * be inserted when it is absent. "pos" may be NULL if the caller does not
 * need the position. */
static uint8_t intsetSearch(intset *is, int64_t value, uint32_t *pos) {
    uint32_t count = intrev32ifbe(is->length);
    int lo, hi;

    /* Nothing can be found in an empty set. */
    if (count == 0) {
        if (pos) *pos = 0;
        return 0;
    }

    /* Fast paths: the value lies outside the stored range, so it is absent
     * and the insert position is one of the two ends. */
    if (value > _intsetGet(is,count-1)) {
        if (pos) *pos = count;
        return 0;
    }
    if (value < _intsetGet(is,0)) {
        if (pos) *pos = 0;
        return 0;
    }

    lo = 0;
    hi = count-1;
    while (lo <= hi) {
        int mid = ((unsigned int)lo + (unsigned int)hi) >> 1;
        int64_t cur = _intsetGet(is,mid);

        if (value == cur) {
            if (pos) *pos = mid;
            return 1;
        }
        if (value > cur)
            lo = mid+1;
        else
            hi = mid-1;
    }

    /* Not found: lo is where the value belongs. */
    if (pos) *pos = lo;
    return 0;
}

/* Switch the intset to the wider encoding required by "value", re-encode
 * every existing element, and insert "value". Returns the (possibly moved)
 * intset. */
static intset *intsetUpgradeAndAdd(intset *is, int64_t value) {
    uint8_t oldenc = intrev32ifbe(is->encoding);
    uint8_t wideenc = _intsetValueEncoding(value);
    int idx = intrev32ifbe(is->length);
    /* A value that forces an upgrade lies outside the current range: a
     * negative one goes to the front, any other one to the back. */
    int shift = (value < 0) ? 1 : 0;

    /* Record the new encoding first so the resize uses the new width. */
    is->encoding = intrev32ifbe(wideenc);
    is = intsetResize(is,intrev32ifbe(is->length)+1);

    /* Re-encode from the last element towards the first so that widened
     * elements never overwrite ones that were not read yet. "shift" leaves
     * the free slot at the front when the new value is prepended. */
    while (idx--) {
        int64_t old = _intsetGetEncoded(is,idx,oldenc);
        _intsetSet(is,idx+shift,old);
    }

    /* Drop the new value into the free slot. */
    if (shift) {
        _intsetSet(is,0,value);
    } else {
        _intsetSet(is,intrev32ifbe(is->length),value);
    }

    is->length = intrev32ifbe(intrev32ifbe(is->length)+1);
    return is;
}

/* Move the elements from index "from" up to the current length so that they
 * start at index "to". The regions may overlap, hence memmove(). */
static void intsetMoveTail(intset *is, uint32_t from, uint32_t to) {
    uint32_t encoding = intrev32ifbe(is->encoding);
    uint32_t bytes = intrev32ifbe(is->length)-from;
    size_t width;

    /* Width in bytes of one element; unknown encodings count as 16 bit. */
    if (encoding == INTSET_ENC_INT64)
        width = sizeof(int64_t);
    else if (encoding == INTSET_ENC_INT32)
        width = sizeof(int32_t);
    else
        width = sizeof(int16_t);

    bytes *= width;
    memmove(is->contents + to*width, is->contents + from*width, bytes);
}

/* Insert "value" into the intset, keeping the elements sorted.
 *
 * Returns the (possibly moved) intset. When "success" is not NULL it is set
 * to 1 if the value was inserted and to 0 if it was already present. */
intset *intsetAdd(intset *is, int64_t value, uint8_t *success) {
    uint32_t pos;

    if (success) *success = 1;

    /* A value too wide for the current encoding cannot be in the set yet and
     * lies outside the stored range, so the upgrade path appends or prepends
     * it. That path always inserts, so *success stays 1. */
    if (_intsetValueEncoding(value) > intrev32ifbe(is->encoding))
        return intsetUpgradeAndAdd(is,value);

    /* The search fills "pos" with the insert position when it fails. */
    if (intsetSearch(is,value,&pos)) {
        if (success) *success = 0;
        return is;
    }

    /* Grow by one slot and open a gap at "pos" unless appending. */
    is = intsetResize(is,intrev32ifbe(is->length)+1);
    if (pos < intrev32ifbe(is->length))
        intsetMoveTail(is,pos,pos+1);

    _intsetSet(is,pos,value);
    is->length = intrev32ifbe(intrev32ifbe(is->length)+1);
    return is;
}

/* Remove "value" from the intset if present.
 *
 * Returns the (possibly moved) intset. When "success" is not NULL it is set
 * to 1 if the value was removed and to 0 if it was not in the set. */
intset *intsetRemove(intset *is, int64_t value, int *success) {
    uint32_t pos;
    uint32_t len;

    if (success) *success = 0;

    /* A value wider than the current encoding cannot be stored here. */
    if (_intsetValueEncoding(value) > intrev32ifbe(is->encoding))
        return is;
    if (!intsetSearch(is,value,&pos))
        return is;

    len = intrev32ifbe(is->length);
    if (success) *success = 1;

    /* Close the gap by shifting the tail down, then shrink by one slot. */
    if (pos < (len-1))
        intsetMoveTail(is,pos+1,pos);
    is = intsetResize(is,len-1);
    is->length = intrev32ifbe(len-1);
    return is;
}

/* Return 1 if "value" is a member of the intset, 0 otherwise. */
uint8_t intsetFind(intset *is, int64_t value) {
    /* A value wider than the current encoding cannot be a member. */
    if (_intsetValueEncoding(value) > intrev32ifbe(is->encoding))
        return 0;
    return intsetSearch(is,value,NULL);
}

/* Return a member chosen with rand(). The set must not be empty: the index
 * is taken modulo the element count. */
int64_t intsetRandom(intset *is) {
    uint32_t count = intrev32ifbe(is->length);

    return _intsetGet(is,rand()%count);
}

/* Fetch the element at index "pos" into *value.
 * Returns 1 when "pos" is within range, 0 (leaving *value untouched) when it
 * is not. */
uint8_t intsetGet(intset *is, uint32_t pos, int64_t *value) {
    if (pos >= intrev32ifbe(is->length))
        return 0;

    *value = _intsetGet(is,pos);
    return 1;
}

/* Number of elements currently stored in the intset. */
uint32_t intsetLen(intset *is) {
    uint32_t count = intrev32ifbe(is->length);

    return count;
}

/* Return intset blob size in bytes: the header plus length * encoding bytes
 * of payload.
 *
 * The product is computed as size_t; with 32 bit operands it would wrap for
 * large sets and under-report the size. */
size_t intsetBlobLen(intset *is) {
    return sizeof(intset)+(size_t)intrev32ifbe(is->length)*intrev32ifbe(is->encoding);
}


================================================
FILE: src/vr_intset.h
================================================
#ifndef _VR_INTSET_H_
#define _VR_INTSET_H_

#include <stdint.h>

/* A set of integers kept as a sorted array of fixed-width elements.
 * vr_intset.c reads and writes both header fields through intrev32ifbe(). */
typedef struct intset {
    uint32_t encoding;  /* width in bytes of every element (2, 4 or 8) */
    uint32_t length;    /* number of elements stored in contents */
    int8_t contents[];  /* length elements of encoding bytes each, ascending */
} intset;

/* Create an empty intset. */
intset *intsetNew(void);
/* Insert value. Returns the possibly reallocated set; *success (if not NULL)
 * is 1 when the value was inserted, 0 when it was already present. */
intset *intsetAdd(intset *is, int64_t value, uint8_t *success);
/* Remove value. Returns the possibly reallocated set; *success (if not NULL)
 * is 1 when the value was removed, 0 when it was not present. */
intset *intsetRemove(intset *is, int64_t value, int *success);
/* Return non-zero when value is a member of the set. */
uint8_t intsetFind(intset *is, int64_t value);
/* Return a member picked with rand(); the set must not be empty. */
int64_t intsetRandom(intset *is);
/* Store the element at index pos in *value; returns 0 if pos is out of
 * range, 1 otherwise. */
uint8_t intsetGet(intset *is, uint32_t pos, int64_t *value);
/* Number of elements. */
uint32_t intsetLen(intset *is);
/* Size in bytes of the header plus the elements. */
size_t intsetBlobLen(intset *is);

#endif


================================================
FILE: src/vr_listen.c
================================================
#include <sys/stat.h>
#include <sys/un.h>

#include <vr_core.h>

/*
 * Build a vr_listen object from a configuration string.
 *
 * listen_str has one of two forms:
 *   - "socket_path [permissions]" when it begins with '/'; the optional
 *     permissions are parsed as an octal number no greater than 0777.
 *   - "hostname:port" otherwise.
 *
 * The name part is copied into vlisten->name and resolved into
 * vlisten->info through vr_resolve(). No socket is opened here: sd is left
 * at -1 until vr_listen_begin() is called.
 *
 * Returns the new object, or NULL when listen_str is NULL or empty, is
 * malformed, an allocation fails or the address cannot be resolved.
 */
vr_listen *
vr_listen_create(sds listen_str)
{
    rstatus_t status;
    vr_listen *vlisten;
    uint8_t *p, *q, *start, *name;
    uint32_t namelen;

    /* An empty string has no last character to start scanning from. */
    if (listen_str == NULL || sdslen(listen_str) == 0) {
        return NULL;
    }

    vlisten = dalloc(sizeof(struct vr_listen));
    if (vlisten == NULL) {
        return NULL;
    }

    vlisten->name = NULL;
    vlisten->port = 0;
    /* vr_listen_begin() tests perm, so it must never be left uninitialized
     * when the string carries no permissions field. */
    vlisten->perm = 0;
    memset(&vlisten->info, 0, sizeof(vlisten->info));
    vlisten->sd = -1;

    start = (uint8_t *)listen_str;
    p = start + sdslen(listen_str) - 1;

    /* Look at the first character, not at the pointer itself. */
    if (listen_str[0] == '/') {
        uint8_t *perm;

        /* parse "socket_path permissions" from the end */
        q = vr_strrchr(p, start, ' ');
        if (q == NULL) {
            /* no permissions field, so use defaults */
            name = start;
            namelen = (uint32_t)sdslen(listen_str);
        } else {
            perm = q + 1;

            p = q - 1;
            name = start;
            namelen = (uint32_t)(p - start + 1);

            errno = 0;
            vlisten->perm = (mode_t)strtol((char *)perm, NULL, 8);
            if (errno || vlisten->perm > 0777) {
                log_error("config file has an invalid file permission in \"socket_path permission\" format string");
                vr_listen_destroy(vlisten);
                return NULL;
            }
        }
    } else {
        uint8_t *port;
        uint32_t portlen;

        /* parse "hostname:port" from the end */
        q = vr_strrchr(p, start, ':');
        if (q == NULL) {
            log_error("config file has an invalid \"hostname:port\" format string");
            vr_listen_destroy(vlisten);
            return NULL;
        }

        port = q + 1;
        portlen = (uint32_t)(p - port + 1);

        p = q - 1;

        name = start;
        namelen = (uint32_t)(p - start + 1);

        vlisten->port = vr_atoi(port, portlen);
        if (vlisten->port < 0 || !vr_valid_port(vlisten->port)) {
            log_error("config file has an invalid port in \"hostname:port\" format string");
            vr_listen_destroy(vlisten);
            return NULL;
        }
    }

    vlisten->name = sdsnewlen(name, namelen);
    if (vlisten->name == NULL) {
        log_error("create a sds string failed: out of memory.");
        vr_listen_destroy(vlisten);
        return NULL;
    }

    status = vr_resolve(vlisten->name, vlisten->port, &vlisten->info);
    if (status != VR_OK) {
        vr_listen_destroy(vlisten);
        return NULL;
    }

    return vlisten;
}

/*
 * Release a vr_listen object: free its name, close its socket when one is
 * open (sd > 0) and free the structure. A NULL argument is ignored.
 */
void
vr_listen_destroy(vr_listen *vliston)
{
    if (vliston != NULL) {
        if (vliston->name) {
            sdsfree(vliston->name);
            vliston->name = NULL;
        }

        if (vliston->sd > 0) {
            close(vliston->sd);
            vliston->sd = -1;
        }

        dfree(vliston);
    }
}

/*
 * Prepare the listening address for (re)use before bind().
 *
 * For AF_INET/AF_INET6 the reuse-address option is set on the socket. For
 * AF_UNIX the socket path is unlinked. Any other family is not expected.
 */
static rstatus_t
vr_listen_reuse(vr_listen *p)
{
    if (p->info.family == AF_INET || p->info.family == AF_INET6) {
        return vr_set_reuseaddr(p->sd);
    }

    if (p->info.family == AF_UNIX) {
        /*
         * bind() fails when the pathname already exists, so remove it
         * first. unlink() reports an error when there is nothing to
         * remove; that error is deliberately ignored.
         */
        struct sockaddr_un *un = (struct sockaddr_un *) &p->info.addr;

        unlink(un->sun_path);
        return VR_OK;
    }

    NOT_REACHED();
    return VR_ERROR;
}

/*
 * Open the listening socket described by vlisten: create it, prepare the
 * address for reuse, bind, apply the configured permissions to a unix
 * socket, start listening and switch the descriptor to non-blocking mode.
 *
 * Returns VR_OK on success and VR_ERROR as soon as one step fails; the
 * failure is logged. The descriptor stays stored in vlisten->sd.
 */
rstatus_t
vr_listen_begin(vr_listen *vlisten)
{
    struct sockaddr *addr = (struct sockaddr *)&vlisten->info.addr;
    rstatus_t rc;

    vlisten->sd = socket(vlisten->info.family, SOCK_STREAM, 0);
    if (vlisten->sd < 0) {
        log_error("socket failed: %s", strerror(errno));
        return VR_ERROR;
    }

    rc = vr_listen_reuse(vlisten);
    if (rc < 0) {
        log_error("reuse of addr %s for listening on p %d failed: %s",
                  vlisten->name, vlisten->sd, strerror(errno));
        return VR_ERROR;
    }

    rc = bind(vlisten->sd, addr, vlisten->info.addrlen);
    if (rc < 0) {
        log_error("bind on p %d to addr %s failed: %s", vlisten->sd,
                  vlisten->name, strerror(errno));
        return VR_ERROR;
    }

    /* Permissions only apply to unix sockets, and only when configured. */
    if (vlisten->info.family == AF_UNIX && vlisten->perm) {
        struct sockaddr_un *un = (struct sockaddr_un *)addr;

        rc = chmod(un->sun_path, vlisten->perm);
        if (rc < 0) {
            log_error("chmod on p %d on addr %s failed: %s", vlisten->sd,
                      vlisten->name, strerror(errno));
            return VR_ERROR;
        }
    }

    rc = listen(vlisten->sd, 512);
    if (rc < 0) {
        log_error("listen on p %d on addr %s failed: %s", vlisten->sd,
                  vlisten->name, strerror(errno));
        return VR_ERROR;
    }

    rc = vr_set_nonblocking(vlisten->sd);
    if (rc < 0) {
        log_error("set nonblock on p %d on addr %s failed: %s", vlisten->sd,
                  vlisten->name, strerror(errno));
        return VR_ERROR;
    }

    return VR_OK;
}

/*
 * Accept one pending connection on the listening socket.
 *
 * Returns the new descriptor, or -1 when nothing could be accepted or when
 * the number of current clients has already reached the configured
 * maximum (the new connection is then closed and counted as rejected).
 */
int
vr_listen_accept(vr_listen *vlisten)
{
    int maxclients;
    int sd;

    ASSERT(vlisten->sd > 0);

    log_debug(LOG_DEBUG,"client_accept");

    conf_server_get(CONFIG_SOPN_MAXCLIENTS,&maxclients);

    /* Only an interrupted accept() is retried; any other failure gives up. */
    while ((sd = accept(vlisten->sd, NULL, NULL)) < 0) {
        if (errno == EINTR) {
            log_debug(LOG_VERB, "accept on p %d not ready - eintr", vlisten->sd);
            continue;
        }

        if (errno == EAGAIN || errno == EWOULDBLOCK || errno == ECONNABORTED) {
            log_debug(LOG_VERB, "accept on p %d not ready - eagain", vlisten->sd);
        } else if (errno == EMFILE || errno == ENFILE) {
            log_debug(LOG_CRIT, "accept on p %d "
                      "max client connections %d "
                      "curr client connections %d failed: %s",
                      vlisten->sd, maxclients,
                      current_clients(), strerror(errno));
        } else {
            log_warn("accept on p %d failed: %s", vlisten->sd, strerror(errno));
        }

        return -1;
    }

    if (current_clients() < maxclients) {
        return sd;
    }

    /* Over the limit: drop the connection we just accepted. */
    log_debug(LOG_CRIT, "client connections %d exceed limit %d",
              current_clients(), maxclients);
    if (close(sd) < 0) {
        log_error("close c %d failed, ignored: %s", sd, strerror(errno));
    }

    update_stats_add(master.vel.stats, rejected_conn, 1);

    return -1;
}


================================================
FILE: src/vr_listen.h
================================================
#ifndef _VR_LISTEN_H_
#define _VR_LISTEN_H_

/* One listening endpoint, built from a configuration string by
 * vr_listen_create() and opened by vr_listen_begin(). */
typedef struct vr_listen {
    sds name;               /* host name or unix socket path (listen string without port/permissions) */
    int port;               /* port; stays 0 for a unix socket path */
    mode_t perm;            /* unix socket permissions, applied with chmod() when non-zero */
    struct sockinfo info;   /* listen socket info, filled in by vr_resolve() */
    int sd;                 /* socket descriptor, -1 until the socket is opened */
}vr_listen;

/* Parse "hostname:port" or "socket_path [permissions]"; returns NULL on error. */
vr_listen *vr_listen_create(sds linten_str);
/* Free the object, closing its socket if one is open. NULL is ignored. */
void vr_listen_destroy(vr_listen *vliston);
/* Create, bind and listen on the socket; returns VR_OK or VR_ERROR. */
rstatus_t vr_listen_begin(struct vr_listen *vlisten);
/* Accept one connection; returns its descriptor or -1. */
int vr_listen_accept(vr_listen *vlisten);

#endif


================================================
FILE: src/vr_lzf.h
================================================
#ifndef _VR_LZF_H_
#define _VR_LZF_H_

/***********************************************************************
**
**	lzf -- an extremely fast/free compression/decompression-method
**	http://liblzf.plan9.de/
**
**	This algorithm is believed to be patent-free.
**
***********************************************************************/

#define LZF_VERSION 0x0105 /* 1.5, API version */

/*
 * Compress in_len bytes stored at the memory block starting at
 * in_data and write the result to out_data, up to a maximum length
 * of out_len bytes.
 *
 * If the output buffer is not large enough or any error occurs return 0,
 * otherwise return the number of bytes used, which might be considerably
 * more than in_len (but less than 104% of the original size), so it
 * makes sense to always use out_len == in_len - 1, to ensure _some_
 * compression, and store the data uncompressed otherwise (with a flag, of
 * course).
 *
 * lzf_compress might use different algorithms on different systems and
 * even different runs, thus might result in different compressed strings
 * depending on the phase of the moon or similar factors. However, all
 * these strings are architecture-independent and will result in the
 * original data when decompressed using lzf_decompress.
 *
 * The buffers must not be overlapping.
 *
 * If the option LZF_STATE_ARG is enabled, an extra argument must be
 * supplied which is not reflected in this header file. Refer to lzfP.h
 * and lzf_c.c.
 *
 */
unsigned int
lzf_compress (const void *const in_data,  unsigned int in_len,
              void             *out_data, unsigned int out_len);

/*
 * Decompress data compressed with some version of the lzf_compress
 * function and stored at location in_data and length in_len. The result
 * will be stored at out_data up to a maximum of out_len characters.
 *
 * Return value:
 *  - the number of decompressed bytes (i.e. the original length of the
 *    data) on success;
 *  - 0 with errno set to E2BIG if the output buffer is not large enough
 *    to hold the decompressed data;
 *  - 0 with errno set to EINVAL if an error in the compressed data is
 *    detected.
 *
 * This function is very fast, about as fast as a copying loop.
 */
unsigned int
lzf_decompress (const void *const in_data,  unsigned int in_len,
                void             *out_data, unsigned int out_len);

#endif


================================================
FILE: src/vr_lzfP.h
================================================
#ifndef _VR_LZFP_H_
#define _VR_LZFP_H_

#define STANDALONE 1 /* at the moment, this is ok. */

/* STANDALONE is unconditionally defined just above, so the include below is
 * never compiled in; this header does not pull in the public prototypes. */
#ifndef STANDALONE
#include <vr_lzf.h>
#endif

/*
 * Size of hashtable is (1 << HLOG) * sizeof (char *)
 * decompression is independent of the hash table size
 * the difference between 15 and 14 is very small
 * for small blocks (and 14 is usually a bit faster).
 * For a low-memory/faster configuration, use HLOG == 13;
 * For best compression, use 15 or 16 (or more, up to 22).
 */
#ifndef HLOG
# define HLOG 16
#endif

/*
 * Sacrifice very little compression quality in favour of compression speed.
 * This gives almost the same compression as the default code, and is
 * (very roughly) 15% faster. This is the preferred mode of operation.
 */
#ifndef VERY_FAST
# define VERY_FAST 1
#endif

/*
 * Sacrifice some more compression quality in favour of compression speed.
 * (roughly 1-2% worse compression for large blocks and
 * 9-10% for small, redundant, blocks and >>20% better speed in both cases)
 * In short: when in need for speed, enable this for binary data,
 * possibly disable this for text data.
 */
#ifndef ULTRA_FAST
# define ULTRA_FAST 0
#endif

/*
 * Unconditionally aligning does not cost very much, so do it if unsure.
 *
 * The default is resolved to a literal 0 or 1 here. Defining the macro as an
 * expression containing "defined" would make every later "#if STRICT_ALIGN"
 * produce "defined" through macro expansion, which is undefined behaviour
 * in the C preprocessor.
 */
#ifndef STRICT_ALIGN
# if defined(__i386) || defined(__amd64)
#  define STRICT_ALIGN 0
# else
#  define STRICT_ALIGN 1
# endif
#endif

/*
 * You may choose to pre-set the hash table (might be faster on some
 * modern cpus and large (>>64k) blocks, and also makes compression
 * deterministic/repeatable when the configuration otherwise is the same).
 */
#ifndef INIT_HTAB
# define INIT_HTAB 0
#endif

/*
 * Avoid assigning values to errno variable? for some embedding purposes
 * (linux kernel for example), this is necessary. NOTE: this breaks
 * the documentation in lzf.h. Avoiding errno has no speed impact.
 */
#ifndef AVOID_ERRNO
# define AVOID_ERRNO 0
#endif

/*
 * Whether to pass the LZF_STATE variable as argument, or allocate it
 * on the stack. For small-stack environments, define this to 1.
 * NOTE: this breaks the prototype in lzf.h.
 */
#ifndef LZF_STATE_ARG
# define LZF_STATE_ARG 0
#endif

/*
 * Whether to add extra checks for input validity in lzf_decompress
 * and return EINVAL if the input stream has been corrupted. This
 * only shields against overflowing the input buffer and will not
 * detect most corrupted streams.
 * This check is not normally noticeable on modern hardware
 * (<1% slowdown), but might slow down older cpus considerably.
 */
#ifndef CHECK_INPUT
# define CHECK_INPUT 1
#endif

/*
 * Whether to store pointers or offsets inside the hash table. On
 * 64 bit architectures, pointers take up twice as much space,
 * and might also be slower. Default is to autodetect.
 */
/*#define LZF_USE_OFFSETS autodetect */

/*****************************************************************************/
/* nothing should be changed below */

#ifdef __cplusplus
# include <cstring>
# include <climits>
using namespace std;
#else
# include <string.h>
# include <limits.h>
#endif

/*
 * Autodetect LZF_USE_OFFSETS unless the user preset it: use offsets when
 * pointers are wider than 32 bits.
 *
 * On WIN32 the value is resolved to a literal 0 or 1, because a macro that
 * expands to "defined(...)" inside "#if" is undefined behaviour in the C
 * preprocessor.
 */
#ifndef LZF_USE_OFFSETS
# if defined (WIN32)
#  if defined (_M_X64)
#   define LZF_USE_OFFSETS 1
#  else
#   define LZF_USE_OFFSETS 0
#  endif
# else
#  if __cplusplus > 199711L
#   include <cstdint>
#  else
#   include <stdint.h>
#  endif
#  define LZF_USE_OFFSETS (UINTPTR_MAX > 0xffffffffU)
# endif
#endif

typedef unsigned char u8;

/* A hash table slot holds either an unsigned int offset (LZF_HSLOT_BIAS is
 * then the start of the input, in_data) or a plain pointer into the input
 * (bias 0), depending on LZF_USE_OFFSETS. */
#if LZF_USE_OFFSETS
# define LZF_HSLOT_BIAS ((const u8 *)in_data)
  typedef unsigned int LZF_HSLOT;
#else
# define LZF_HSLOT_BIAS 0
  typedef const u8 *LZF_HSLOT;
#endif

/* The hash table: 1 << HLOG slots. */
typedef LZF_HSLOT LZF_STATE[1 << (HLOG)];

#if !STRICT_ALIGN
/* for unaligned accesses we need a 16 bit datatype. */
# if USHRT_MAX == 65535
    typedef unsigned short u16;
# elif UINT_MAX == 65535
    typedef unsigned int u16;
# else
/* no 16 bit type available: fall back to strictly aligned accesses. */
#  undef STRICT_ALIGN
#  define STRICT_ALIGN 1
# endif
#endif

/* ULTRA_FAST takes precedence: VERY_FAST is undefined when it is enabled. */
#if ULTRA_FAST
# undef VERY_FAST
#endif

#endif


================================================
FILE: src/vr_lzf_c.c
================================================
#include <vr_lzfP.h>

#define HSIZE (1 << (HLOG))

/*
 * don't play with this unless you benchmark!
 * the data format is not dependent on the hash function.
 * the hash function might seem strange, just believe me,
 * it works ;)
 */
#ifndef FRST
# define FRST(p) (((p[0]) << 8) | p[1])
# define NEXT(v,p) (((v) << 8) | p[2])
# if ULTRA_FAST
#  define IDX(h) ((( h             >> (3*8 - HLOG)) - h  ) & (HSIZE - 1))
# elif VERY_FAST
#  define IDX(h) ((( h             >> (3*8 - HLOG)) - h*5) & (HSIZE - 1))
# else
#  define IDX(h) ((((h ^ (h << 5)) >> (3*8 - HLOG)) - h*5) & (HSIZE - 1))
# endif
#endif
/*
 * IDX works because it is very similar to a multiplicative hash, e.g.
 * ((h * 57321 >> (3*8 - HLOG)) & (HSIZE - 1))
 * the latter is also quite fast on newer CPUs, and compresses similarly.
 *
 * the next one is also quite good, albeit slow ;)
 * (int)(cos(h & 0xffffff) * 1e6)
 */

#if 0
/* original lzv-like hash function, much worse and thus slower */
# define FRST(p) (p[0] << 5) ^ p[1]
# define NEXT(v,p) ((v) << 5) ^ p[2]
# define IDX(h) ((h) & (HSIZE - 1))
#endif

#define        MAX_LIT        (1 <<  5)
#define        MAX_OFF        (1 << 13)
#define        MAX_REF        ((1 << 8) + (1 << 3))

#if __GNUC__ >= 3
# define expect(expr,value)         __builtin_expect ((expr),(value))
# define inline                     inline
#else
# define expect(expr,value)         (expr)
# define inline                     static
#endif

#define expect_false(expr) expect ((expr) != 0, 0)
#define expect_true(expr)  expect ((expr) != 0, 1)

/*
 * compressed format
 *
 * 000LLLLL <L+1>    ; literal, L+1=1..32 octets
 * LLLooooo oooooooo ; backref L+1=1..7 octets, o+1=1..8192 offset
 * 111ooooo LLLLLLLL oooooooo ; backref L+8 octets, o+1=1..8192 offset
 *
 */

/*
 * Compress in_len octets starting at in_data into out_data, which has room
 * for out_len octets, using the format described above.
 *
 * When LZF_STATE_ARG is set the caller supplies the hash table (htab);
 * otherwise a local LZF_STATE is used.
 *
 * Returns the number of octets written to out_data, or 0 when either
 * length is zero or the compressed data would not fit into out_len octets.
 */
unsigned int
lzf_compress (const void *const in_data, unsigned int in_len,
	      void *out_data, unsigned int out_len
#if LZF_STATE_ARG
              , LZF_STATE htab
#endif
              )
{
#if !LZF_STATE_ARG
  LZF_STATE htab;
#endif
  const u8 *ip = (const u8 *)in_data;
        u8 *op = (u8 *)out_data;
  const u8 *in_end  = ip + in_len;
        u8 *out_end = op + out_len;
  const u8 *ref;

  /* off requires a type wide enough to hold a general pointer difference.
   * ISO C doesn't have that (size_t might not be enough and ptrdiff_t only
   * works for differences within a single object). We also assume that
   * no bit pattern traps. Since the only platform that is both non-POSIX
   * and fails to support both assumptions is windows 64 bit, we make a
   * special workaround for it.
   */
#if defined (WIN32) && defined (_M_X64)
  unsigned _int64 off; /* workaround for missing POSIX compliance */
#else
  unsigned long off;
#endif
  unsigned int hval;
  int lit; /* number of literal octets in the currently open run */

  if (!in_len || !out_len)
    return 0;

#if INIT_HTAB
  memset (htab, 0, sizeof (htab));
#endif

  /* reserve one octet for the literal run header, filled in when the run ends */
  lit = 0; op++; /* start run */

  hval = FRST (ip);
  while (ip < in_end - 2)
    {
      LZF_HSLOT *hslot;

      /* look up the candidate for the current position and record ip in its slot */
      hval = NEXT (hval, ip);
      hslot = htab + IDX (hval);
      ref = *hslot + LZF_HSLOT_BIAS; *hslot = ip - LZF_HSLOT_BIAS;

      if (1
#if INIT_HTAB
          && ref < ip /* the next test will actually take care of this, but this is faster */
#endif
          && (off = ip - ref - 1) < MAX_OFF
          && ref > (u8 *)in_data
          && ref[2] == ip[2]
#if STRICT_ALIGN
          && ((ref[1] << 8) | ref[0]) == ((ip[1] << 8) | ip[0])
#else
          && *(u16 *)ref == *(u16 *)ip
#endif
        )
        {
          /* match found at *ref++ */
          unsigned int len = 2;
          unsigned int maxlen = in_end - ip - len;
          maxlen = maxlen > MAX_REF ? MAX_REF : maxlen;

          if (expect_false (op + 3 + 1 >= out_end)) /* first a faster conservative test */
            if (op - !lit + 3 + 1 >= out_end) /* second the exact but rare test */
              return 0;

          op [- lit - 1] = lit - 1; /* stop run */
          op -= !lit; /* undo run if length is zero */

          /* extend the match; the unrolled part runs only when more than 16 octets may follow */
          for (;;)
            {
              if (expect_true (maxlen > 16))
                {
                  len++; if (ref [len] != ip [len]) break;
                  len++; if (ref [len] != ip [len]) break;
                  len++; if (ref [len] != ip [len]) break;
                  len++; if (ref [len] != ip [len]) break;

                  len++; if (ref [len] != ip [len]) break;
                  len++; if (ref [len] != ip [len]) break;
                  len++; if (ref [len] != ip [len]) break;
                  len++; if (ref [len] != ip [len]) break;

                  len++; if (ref [len] != ip [len]) break;
                  len++; if (ref [len] != ip [len]) break;
                  len++; if (ref [len] != ip [len]) break;
                  len++; if (ref [len] != ip [len]) break;

                  len++; if (ref [len] != ip [len]) break;
                  len++; if (ref [len] != ip [len]) break;
                  len++; if (ref [len] != ip [len]) break;
                  len++; if (ref [len] != ip [len]) break;
                }

              do
                len++;
              while (len < maxlen && ref[len] == ip[len]);

              break;
            }

          len -= 2; /* len is now #octets - 1 */
          ip++;

          /* emit the back reference: short form for len < 7, long form otherwise */
          if (len < 7)
            {
              *op++ = (off >> 8) + (len << 5);
            }
          else
            {
              *op++ = (off >> 8) + (  7 << 5);
              *op++ = len - 7;
            }

          *op++ = off;

          lit = 0; op++; /* start run */

          ip += len + 1;

          if (expect_false (ip >= in_end - 2))
            break;

          /* re-seed the hash table: only the last position(s) in the fast
           * modes, every matched position otherwise */
#if ULTRA_FAST || VERY_FAST
          --ip;
# if VERY_FAST && !ULTRA_FAST
          --ip;
# endif
          hval = FRST (ip);

          hval = NEXT (hval, ip);
          htab[IDX (hval)] = ip - LZF_HSLOT_BIAS;
          ip++;

# if VERY_FAST && !ULTRA_FAST
          hval = NEXT (hval, ip);
          htab[IDX (hval)] = ip - LZF_HSLOT_BIAS;
          ip++;
# endif
#else
          ip -= len + 1;

          do
            {
              hval = NEXT (hval, ip);
              htab[IDX (hval)] = ip - LZF_HSLOT_BIAS;
              ip++;
            }
          while (len--);
#endif
        }
      else
        {
          /* one more literal byte we must copy */
          if (expect_false (op >= out_end))
            return 0;

          lit++; *op++ = *ip++;

          if (expect_false (lit == MAX_LIT))
            {
              op [- lit - 1] = lit - 1; /* stop run */
              lit = 0; op++; /* start run */
            }
        }
    }

  if (op + 3 > out_end) /* at most 3 bytes can be missing here */
    return 0;

  /* copy the remaining input octets as literals */
  while (ip < in_end)
    {
      lit++; *op++ = *ip++;

      if (expect_false (lit == MAX_LIT))
        {
          op [- lit - 1] = lit - 1; /* stop run */
          lit = 0; op++; /* start run */
        }
    }

  op [- lit - 1] = lit - 1; /* end run */
  op -= !lit; /* undo run if length is zero */

  return op - (u8 *)out_data;
}


================================================
FILE: src/vr_lzf_d.c
================================================
#include <vr_lzfP.h>

/* SET_ERRNO(n) stores the failure reason in errno; when the build sets
 * AVOID_ERRNO it expands to nothing and <errno.h> is not included. */
#if AVOID_ERRNO
# define SET_ERRNO(n)
#else
# include <errno.h>
# define SET_ERRNO(n) errno = (n)
#endif

/* Optional "rep movsb" copy primitive. It is only defined when
 * USE_REP_MOVSB is enabled and the compiler is GCC >= 3 targeting
 * i386/amd64; the decompressor checks for it with #ifdef lzf_movsb. */
#if USE_REP_MOVSB /* small win on amd, big loss on intel */
#if (__i386 || __amd64) && __GNUC__ >= 3
# define lzf_movsb(dst, src, len)                \
   asm ("rep movsb"                              \
        : "=D" (dst), "=S" (src), "=c" (len)     \
        :  "0" (dst),  "1" (src),  "2" (len));
#endif
#endif

/*
 * Decompress in_len octets of LZF data from in_data into out_data, which
 * has room for out_len octets.
 *
 * Returns the number of octets written to out_data. On failure it returns 0
 * and reports the reason through SET_ERRNO: E2BIG when the output does not
 * fit into out_len octets, EINVAL when a back reference points before
 * out_data or (only when CHECK_INPUT is enabled) the input is truncated.
 *
 * NOTE(review): the loop is a do/while, so one control octet is read from
 * in_data before in_len is examined - callers presumably never pass
 * in_len == 0; confirm.
 */
unsigned int
lzf_decompress (const void *const in_data,  unsigned int in_len,
                void             *out_data, unsigned int out_len)
{
  u8 const *ip = (const u8 *)in_data;
  u8       *op = (u8 *)out_data;
  u8 const *const in_end  = ip + in_len;
  u8       *const out_end = op + out_len;

  do
    {
      unsigned int ctrl = *ip++;

      if (ctrl < (1 << 5)) /* literal run */
        {
          ctrl++; /* ctrl is now the number of literal octets, 1..32 */

          if (op + ctrl > out_end)
            {
              SET_ERRNO (E2BIG);
              return 0;
            }

#if CHECK_INPUT
          if (ip + ctrl > in_end)
            {
              SET_ERRNO (EINVAL);
              return 0;
            }
#endif

#ifdef lzf_movsb
          lzf_movsb (op, ip, ctrl);
#else
          /* every case deliberately falls through, copying exactly ctrl octets */
          switch (ctrl)
            {
              case 32: *op++ = *ip++; case 31: *op++ = *ip++; case 30: *op++ = *ip++; case 29: *op++ = *ip++;
              case 28: *op++ = *ip++; case 27: *op++ = *ip++; case 26: *op++ = *ip++; case 25: *op++ = *ip++;
              case 24: *op++ = *ip++; case 23: *op++ = *ip++; case 22: *op++ = *ip++; case 21: *op++ = *ip++;
              case 20: *op++ = *ip++; case 19: *op++ = *ip++; case 18: *op++ = *ip++; case 17: *op++ = *ip++;
              case 16: *op++ = *ip++; case 15: *op++ = *ip++; case 14: *op++ = *ip++; case 13: *op++ = *ip++;
              case 12: *op++ = *ip++; case 11: *op++ = *ip++; case 10: *op++ = *ip++; case  9: *op++ = *ip++;
              case  8: *op++ = *ip++; case  7: *op++ = *ip++; case  6: *op++ = *ip++; case  5: *op++ = *ip++;
              case  4: *op++ = *ip++; case  3: *op++ = *ip++; case  2: *op++ = *ip++; case  1: *op++ = *ip++;
            }
#endif
        }
      else /* back reference */
        {
          unsigned int len = ctrl >> 5;

          /* high bits of the offset come from the control octet */
          u8 *ref = op - ((ctrl & 0x1f) << 8) - 1;

#if CHECK_INPUT
          if (ip >= in_end)
            {
              SET_ERRNO (EINVAL);
              return 0;
            }
#endif
          if (len == 7)
            {
              /* long form: an extra octet extends the length */
              len += *ip++;
#if CHECK_INPUT
              if (ip >= in_end)
                {
                  SET_ERRNO (EINVAL);
                  return 0;
                }
#endif
            }

          /* low octet of the offset */
          ref -= *ip++;

          if (op + len + 2 > out_end)
            {
              SET_ERRNO (E2BIG);
              return 0;
            }

          if (ref < (u8 *)out_data)
            {
              SET_ERRNO (EINVAL);
              return 0;
            }

#ifdef lzf_movsb
          len += 2;
          lzf_movsb (op, ref, len);
#else
          /* lengths 0..9 use the fall-through ladder below (len + 2 octets);
           * anything longer takes the default branch */
          switch (len)
            {
              default:
                len += 2;

                if (op >= ref + len)
                  {
                    /* disjunct areas */
                    memcpy (op, ref, len);
                    op += len;
                  }
                else
                  {
                    /* overlapping, use octet by octet copying */
                    do
                      *op++ = *ref++;
                    while (--len);
                  }

                break;

              case 9: *op++ = *ref++;
              case 8: *op++ = *ref++;
              case 7: *op++ = *ref++;
              case 6: *op++ = *ref++;
              case 5: *op++ = *ref++;
              case 4: *op++ = *ref++;
              case 3: *op++ = *ref++;
              case 2: *op++ = *ref++;
              case 1: *op++ = *ref++;
              case 0: *op++ = *ref++; /* two octets more */
                      *op++ = *ref++;
            }
#endif
        }
    }
  while (ip < in_end);

  return op - (u8 *)out_data;
}


================================================
FILE: src/vr_master.c
================================================
#include <vr_core.h>

vr_master master;

static int setup_master(void);
static void *master_thread_run(void *args);

/*
 * Initialize the global master: its swap-unit list lock, its event loop,
 * one listener per configured bind address, the connection back swap unit
 * list, and finally the file events registered by setup_master().
 *
 * Returns VR_OK on success. Returns VR_ERROR when a listener cannot be
 * created or started, VR_ENOMEM when an allocation fails, and the status
 * of setup_master() when registering the file events fails.
 */
int
master_init(vr_conf *conf)
{
    rstatus_t status;
    uint32_t j;
    sds *host, listen_str;
    vr_listen **vlisten;
    int threads_num;
    int filelimit;

    master.cbsul = NULL;
    pthread_mutex_init(&master.cbsullock, NULL);

    conf_server_get(CONFIG_SOPN_THREADS,&threads_num);
    filelimit = threads_num*2+CONFIG_MIN_RESERVED_FDS;
    vr_eventloop_init(&master.vel,filelimit);
    master.vel.thread.fun_run = master_thread_run;

    darray_init(&master.listens,darray_n(&cserver->binds),sizeof(vr_listen*));

    /* Create one listener per bind address, named "<host>:<port>". */
    for (j = 0; j < darray_n(&cserver->binds); j ++) {
        host = darray_get(&cserver->binds,j);
        listen_str = sdsdup(*host);
        listen_str = sdscatfmt(listen_str, ":%i", cserver->port);
        vlisten = darray_push(&master.listens);
        if (vlisten == NULL) {
            /* No slot could be obtained; do not dereference it. */
            log_error("Create listen %s failed: out of memory", listen_str);
            sdsfree(listen_str);
            return VR_ENOMEM;
        }
        *vlisten = vr_listen_create(listen_str);
        if (*vlisten == NULL) {
            /* Drop the empty slot so master_deinit() never sees a NULL. */
            darray_pop(&master.listens);
            log_error("Create listen %s failed", listen_str);
            sdsfree(listen_str);
            return VR_ERROR;
        }
        sdsfree(listen_str);
    }

    for (j = 0; j < darray_n(&master.listens); j ++) {
        vlisten = darray_get(&master.listens, j);
        status = vr_listen_begin(*vlisten);
        if (status != VR_OK) {
            log_error("Begin listen to %s failed", (*vlisten)->name);
            return VR_ERROR;
        }
    }

    master.cbsul = dlistCreate();
    if (master.cbsul == NULL) {
        log_error("Create list failed: out of memory");
        return VR_ENOMEM;
    }

    /* A master without its file events cannot accept or swap connections,
     * so a failure here must not be reported as success. */
    status = setup_master();
    if (status != VR_OK) {
        return status;
    }

    return VR_OK;
}

/*
 * Tear down the master: release its event loop, then destroy every
 * listener and the array that held them.
 */
void
master_deinit(void)
{
    vr_eventloop_deinit(&master.vel);

    /* Pop listeners from the tail until none are left. */
    while (darray_n(&master.listens) > 0) {
        vr_listen **slot = darray_pop(&master.listens);

        vr_listen_destroy(*slot);
    }

    darray_deinit(&master.listens);
}

/*
 * Readable-event handler for a listening socket. privdata is the vr_listen
 * the event was registered with; connections are accepted and dispatched
 * until vr_listen_accept() stops returning a positive descriptor.
 */
static void
client_accept(aeEventLoop *el, int fd, void *privdata, int mask) {
    vr_listen *listener = privdata;
    int sd;

    for (;;) {
        sd = vr_listen_accept(listener);
        if (sd <= 0) {
            break;
        }
        dispatch_conn_new(listener, sd);
    }
}

/* Add a swap unit to the master's connection back swap unit list while
 * holding the list lock. */
static void
cbsul_push(struct connswapunit *su)
{
    pthread_mutex_t *lock = &master.cbsullock;

    pthread_mutex_lock(lock);
    dlistPush(master.cbsul, su);
    pthread_mutex_unlock(lock);
}

/* Take one swap unit from the master's connection back swap unit list
 * while holding the list lock; returns whatever dlistPop() yields. */
static struct connswapunit *
cbsul_pop(void)
{
    pthread_mutex_t *lock = &master.cbsullock;
    struct connswapunit *unit;

    pthread_mutex_lock(lock);
    unit = dlistPop(master.cbsul);
    pthread_mutex_unlock(lock);

    return unit;
}

/*
 * Hand an existing client over to the worker with index tid, going through
 * the master: the client is wrapped in a swap unit, detached from its
 * current event loop, queued on the master's back swap list, and the
 * master is notified with a 'b' byte written to the current worker's
 * socketpairs[1].
 *
 * If no swap unit can be allocated the client is freed instead.
 */
void
dispatch_conn_exist(client *c, int tid)
{
    char note = 'b';    /* 'b': back to master */
    vr_worker *worker;
    struct connswapunit *su;

    su = csui_new();
    if (su == NULL) {
        freeClient(c);
        /* given that malloc failed this may also fail, but let's try */
        log_error("Failed to allocate memory for connection swap object\n");
        return ;
    }

    su->data = c;
    su->num = tid;

    unlinkClientFromEventloop(c);

    cbsul_push(su);

    worker = darray_get(&workers, (uint32_t)c->curidx);
    if (vr_write(worker->socketpairs[1], &note, 1) != 1) {
        log_error("Notice the worker failed.");
    }
}

/*
 * Readable-event handler for a worker's socketpairs[0] in the master loop.
 * privdata is the worker that owns the socket pair.
 *
 * A 'b' byte means a worker queued a swap unit on the back swap list: the
 * unit is popped, re-labelled with the sending worker's id, pushed onto the
 * target worker's list and that worker is woken with a 'j' byte. A failed
 * read is treated as if 'b' had been received. Any other byte is logged.
 */
static void
thread_event_process(aeEventLoop *el, int fd, void *privdata, int mask) {
    vr_worker *worker = privdata;
    struct connswapunit *su;
    char buf[1];
    int target;

    ASSERT(el == master.vel.el);
    ASSERT(fd == worker->socketpairs[0]);

    if (vr_read(fd, buf, 1) != 1) {
        log_warn("Can't read for worker(id:%d) socketpairs[1](%d)", 
            worker->vel.thread.id, fd);
        buf[0] = 'b';
    }

    if (buf[0] != 'b') {
        log_error("read error char '%c' for worker(id:%d) socketpairs[0](%d)", 
            buf[0], worker->vel.thread.id, worker->socketpairs[1]);
        return;
    }

    su = cbsul_pop();
    if (su == NULL) {
        log_warn("Pop from connection back swap list is null");
        return;
    }

    /* su->num carries the target worker index in, the source worker id out. */
    target = su->num;
    su->num = worker->id;
    worker = darray_get(&workers, (uint32_t)target);
    csul_push(worker, su);

    /* Jump to the target worker. */
    buf[0] = 'j';
    if (vr_write(worker->socketpairs[0], buf, 1) != 1) {
        log_error("Notice the worker failed.");
    }
}

static int
setup_master(void)
{
    rstatus_t status;
    uint32_t j;
    vr_listen **vlisten;
    vr_worker *worker;

    for (j = 0; j < darray_n(&workers); j ++) {
        worker = darray_get(&workers, j);
        status = aeCreateFileEvent(master.vel.el, worker->socketpairs[0], 
            AE_READABLE, thread_event_process, worker);
        if (status == AE_ERR) {
            log_error("Unrecoverable error creating master ipfd file event.");
            return VR_ERROR;
        }
    }

    for (j = 0; j < darray_n(&master.listens); j ++) {
        vlisten = darray_get(&master.listens,j);
        status = aeCreateFileEvent(master.vel.el, (*vlisten)->sd, AE_READABLE, 
            client_accept, *vlisten);
        if (status == AE_ERR) {
            log_error("Unrecoverable error creating master ipfd file event.");
            return VR_ERROR;
        }
    }
    
    return VR_OK;
}

static void *
master_thread_run(void *args)
{    
    /* vire master run */
    aeMain(master.vel.el);

    return NULL;
}

int
master_run(void)
{
    vr_thread_start(&master.vel.thread);
    return VR_OK;
}


================================================
FILE: src/vr_master.h
================================================
#ifndef _VR_MASTER_H_
#define _VR_MASTER_H_

/* State of the master thread, which owns the listening sockets and relays
 * connection swap units between workers. */
typedef struct vr_master {

    vr_eventloop vel;        /* event loop and thread of the master */
    
    struct darray listens;   /* elements are vr_listen * (one per bind address) */

    dlist *cbsul;    /* Connect back swap unit list */
    pthread_mutex_t cbsullock;   /* lock protecting cbsul */
}vr_master;

extern vr_master master;

int master_init(vr_conf *conf);
void master_deinit(void);

void dispatch_conn_exist(struct client *c, int tid);

int master_run(void);

#endif


================================================
FILE: src/vr_multi.c
================================================
#include <vr_core.h>

/* ===================== WATCH (CAS alike for MULTI/EXEC) ===================
 *
 * The implementation uses a per-DB hash table mapping keys to list of clients
 * WATCHing those keys, so that given a key that is going to be modified
 * we can mark all the associated clients as dirty.
 *
 * Also every client contains a list of WATCHed keys so that's possible to
 * un-watch such keys when the client is freed or when UNWATCH is called. */

/* In the client->watched_keys list we need to use watchedKey structures
 * as in order to identify a key in Redis we need both the key name and the
 * DB */
/* One entry of client->watched_keys: a key name together with the DB it
 * is watched in. */
typedef struct watchedKey {
    robj *key;      /* watched key name; a reference is held while listed */
    redisDb *db;    /* database the key is watched in */
} watchedKey;

/* Unwatch all the keys watched by this client. To clean the EXEC dirty
 * flag is up to the caller. */
/* Drop every WATCH held by this client: the client is removed from each
 * key's watcher list in the owning DB, empty watcher lists are deleted
 * from the DB, and the client's own list entries are released.
 * Clearing the dirty flags is left to the caller. */
void unwatchAllKeys(client *c) {
    dlistIter iter;
    dlistNode *node;

    if (dlistLength(c->watched_keys) == 0) return;

    dlistRewind(c->watched_keys,&iter);
    for (node = dlistNext(&iter); node != NULL; node = dlistNext(&iter)) {
        watchedKey *wk = dlistNodeValue(node);
        dlist *watchers = dictFetchValue(wk->db->watched_keys, wk->key);

        /* The key must still map to a watcher list containing this client. */
        serverAssertWithInfo(c,NULL,watchers != NULL);
        dlistDelNode(watchers,dlistSearchKey(watchers,c));

        /* Last watcher gone: remove the key from the DB table as well. */
        if (dlistLength(watchers) == 0)
            dictDelete(wk->db->watched_keys, wk->key);

        /* Finally release the client's own record of the watch. */
        dlistDelNode(c->watched_keys,node);
        decrRefCount(wk->key);
        dfree(wk);
    }
}

/* Client state initialization for MULTI/EXEC */
/* Reset the client's MULTI/EXEC queue to "empty": no commands array and a
 * zero command count. */
void initClientMultiState(client *c) {
    c->mstate.count = 0;
    c->mstate.commands = NULL;
}

/* Release all the resources associated with MULTI/EXEC state */
/* Free everything owned by the client's MULTI/EXEC queue: a reference on
 * every queued argument, each argument vector, and the commands array. */
void freeClientMultiState(client *c) {
    int idx;

    for (idx = 0; idx < c->mstate.count; idx++) {
        multiCmd *queued = &c->mstate.commands[idx];
        int arg = 0;

        while (arg < queued->argc) {
            decrRefCount(queued->argv[arg]);
            arg++;
        }
        dfree(queued->argv);
    }

    if (c->mstate.commands != NULL) dfree(c->mstate.commands);
}

/* Add a new command into the MULTI commands queue */
/* Append the client's current command to its MULTI queue. The argument
 * vector is copied and every argument gets an extra reference, so the
 * queued command stays valid independently of c->argv. */
void queueMultiCommand(client *c) {
    multiCmd *slot;
    int i;

    /* Grow the queue by one entry and fill in the new last slot. */
    c->mstate.commands = drealloc(c->mstate.commands,
            sizeof(multiCmd)*(c->mstate.count+1));
    slot = &c->mstate.commands[c->mstate.count];

    slot->cmd = c->cmd;
    slot->argc = c->argc;
    slot->argv = dalloc(sizeof(robj*)*c->argc);
    memcpy(slot->argv,c->argv,sizeof(robj*)*c->argc);

    i = 0;
    while (i < c->argc) {
        incrRefCount(slot->argv[i]);
        i++;
    }

    c->mstate.count++;
}

/* Flag the transacation as DIRTY_EXEC so that EXEC will fail.
 * Should be called every time there is an error while queueing a command. */
/* Mark the running transaction as DIRTY_EXEC; does nothing when the client
 * is not inside MULTI. Meant to be called whenever queueing a command
 * fails. */
void flagTransaction(client *c) {
    if (!(c->flags & CLIENT_MULTI)) return;

    c->flags |= CLIENT_DIRTY_EXEC;
}

/* EXEC command handler. As written it only replies with shared.ok: it does
 * not run the queued commands, inspect the dirty flags, or leave the MULTI
 * state.
 * NOTE(review): presumably a placeholder for a not-yet-ported EXEC -
 * confirm whether transactions are meant to be supported. */
void execCommand(client *c) {
    addReply(c,shared.ok);
}

/* DISCARD command handler: abort the current transaction and reply OK, or
 * reply with an error when the client is not inside MULTI. */
void discardCommand(client *c) {
    if (c->flags & CLIENT_MULTI) {
        discardTransaction(c);
        addReply(c,shared.ok);
    } else {
        addReplyError(c,"DISCARD without MULTI");
    }
}

/* Throw away the client's transaction: free and reset the command queue,
 * clear the MULTI and both dirty flags, and unwatch all keys. */
void discardTransaction(client *c) {
    /* Release the queued commands and start from an empty queue. */
    freeClientMultiState(c);
    initClientMultiState(c);

    c->flags &= ~CLIENT_MULTI;
    c->flags &= ~CLIENT_DIRTY_CAS;
    c->flags &= ~CLIENT_DIRTY_EXEC;

    unwatchAllKeys(c);
}

/* MULTI command handler: enter transaction mode and reply OK, or reply
 * with an error when the client is already inside MULTI. */
void multiCommand(client *c) {
    if (!(c->flags & CLIENT_MULTI)) {
        c->flags |= CLIENT_MULTI;
        addReply(c,shared.ok);
    } else {
        addReplyError(c,"MULTI calls can not be nested");
    }
}

/* Watch for the specified key */
/* Make client c watch 'key' in its currently selected DB. Nothing happens
 * if the client already watches that key in that DB. Otherwise the client
 * is appended to the key's watcher list in the DB (created on demand) and
 * a watchedKey record is appended to c->watched_keys. */
void watchForKey(client *c, robj *key) {
    dlistIter iter;
    dlistNode *node;
    dlist *watchers;
    watchedKey *entry;

    /* Already watched by this client in this DB? Then we are done. */
    dlistRewind(c->watched_keys,&iter);
    for (node = dlistNext(&iter); node != NULL; node = dlistNext(&iter)) {
        entry = dlistNodeValue(node);
        if (entry->db != c->db) continue;
        if (equalStringObjects(key,entry->key)) return;
    }

    /* Register the client in the DB-wide key -> watchers table. */
    watchers = dictFetchValue(c->db->watched_keys,key);
    if (watchers == NULL) {
        watchers = dlistCreate();
        dictAdd(c->db->watched_keys,key,watchers);
        incrRefCount(key);
    }
    dlistAddNodeTail(watchers,c);

    /* Remember the watch on the client side as well. */
    entry = dalloc(sizeof(*entry));
    entry->key = key;
    entry->db = c->db;
    incrRefCount(key);
    dlistAddNodeTail(c->watched_keys,entry);
}

/* WATCH command handler: watch every key given as argument and reply OK.
 * Replies with an error instead when issued inside MULTI. */
void watchCommand(client *c) {
    int arg = 1;    /* argv[0] is the command name itself */

    if (c->flags & CLIENT_MULTI) {
        addReplyError(c,"WATCH inside MULTI is not allowed");
        return;
    }

    while (arg < c->argc) {
        watchForKey(c,c->argv[arg]);
        arg++;
    }
    addReply(c,shared.ok);
}

/* "Touch" a key, so that if this key is being WATCHed by some client the
 * next EXEC will fail. */
/* Signal that 'key' in 'db' is being modified: every client watching it is
 * flagged CLIENT_DIRTY_CAS. Returns early when the DB has no watched keys
 * or nobody watches this key. */
void touchWatchedKey(redisDb *db, robj *key) {
    dlist *watchers;
    dlistIter iter;
    dlistNode *node;

    if (dictSize(db->watched_keys) == 0) return;

    watchers = dictFetchValue(db->watched_keys, key);
    if (watchers == NULL) return;

    /* Flag each watcher of this key as dirty. */
    dlistRewind(watchers,&iter);
    for (node = dlistNext(&iter); node != NULL; node = dlistNext(&iter)) {
        client *watcher = dlistNodeValue(node);

        watcher->flags |= CLIENT_DIRTY_CAS;
    }
}

/* On FLUSHDB or FLUSHALL all the watched keys that are present before the
 * flush but will be deleted as effect of the flushing operation should
 * be touched. "dbid" is the DB that's getting the flush. -1 if it is
 * a FLUSHALL operation (all the DBs flushed). */
/* Called for FLUSHDB / FLUSHALL. 'dbid' is the DB being flushed, or -1 for
 * all DBs. Every client in server.clients that watches a key which exists
 * in a flushed DB is flagged CLIENT_DIRTY_CAS, since that key is about to
 * be removed. */
void touchWatchedKeysOnFlush(int dbid) {
    dlistIter client_iter, key_iter;
    dlistNode *client_node, *key_node;

    dlistRewind(server.clients,&client_iter);
    while ((client_node = dlistNext(&client_iter)) != NULL) {
        client *c = dlistNodeValue(client_node);

        dlistRewind(c->watched_keys,&key_iter);
        while ((key_node = dlistNext(&key_iter)) != NULL) {
            watchedKey *wk = dlistNodeValue(key_node);

            /* Skip keys living in a DB that is not being flushed. */
            if (dbid != -1 && wk->db->id != dbid) continue;

            /* Only an existing key is actually changed by the flush. */
            if (dictFind(wk->db->dict, wk->key->ptr) != NULL)
                c->flags |= CLIENT_DIRTY_CAS;
        }
    }
}


================================================
FILE: src/vr_multi.h
================================================
#ifndef _VR_MULTI_H_
#define _VR_MULTI_H_

/* Client MULTI/EXEC state */
/* One command queued inside a MULTI block. */
typedef struct multiCmd {
    robj **argv;                /* argument vector of the queued command */
    int argc;                   /* number of entries in argv */
    struct redisCommand *cmd;   /* command to run */
} multiCmd;

/* Per-client MULTI/EXEC state: the queue of commands collected so far. */
typedef struct multiState {
    multiCmd *commands;     /* Array of MULTI commands */
    int count;              /* Total number of MULTI commands */
    int minreplicas;        /* MINREPLICAS for synchronous replication */
    time_t minreplicas_timeout; /* MINREPLICAS timeout as unixtime. */
} multiState;

void unwatchAllKeys(struct client *c);
void initClientMultiState(struct client *c);
void freeClientMultiState(struct client *c);
void queueMultiCommand(struct client *c);

void flagTransaction(struct client *c);
void execCommand(struct client *c);
void discardCommand(struct client *c);
void discardTransaction(struct client *c);
void multiCommand(struct client *c);
void watchForKey(struct client *c, robj *key);
void watchCommand(struct client *c);
void touchWatchedKey(redisDb *db, robj *key);
void touchWatchedKeysOnFlush(int dbid) ;

#endif


================================================
FILE: src/vr_notify.c
================================================
#include <vr_core.h>

/* This file implements keyspace events notification via Pub/Sub ad
 * described at http://redis.io/topics/keyspace-events. */

/* Turn a string representing notification classes into an integer
 * representing notification classes flags xored.
 *
 * The function returns -1 if the input contains characters not mapping to
 * any class. */
/* Parse a string of notification class characters into the OR of the
 * matching NOTIFY_* flags. An empty string yields 0; any character that
 * does not name a class makes the function return -1. */
int keyspaceEventsStringToFlags(char *classes) {
    int flags = 0;
    char *cursor;

    for (cursor = classes; *cursor != '\0'; cursor++) {
        int bit;

        switch(*cursor) {
        case 'A': bit = NOTIFY_ALL; break;
        case 'g': bit = NOTIFY_GENERIC; break;
        case '$': bit = NOTIFY_STRING; break;
        case 'l': bit = NOTIFY_LIST; break;
        case 's': bit = NOTIFY_SET; break;
        case 'h': bit = NOTIFY_HASH; break;
        case 'z': bit = NOTIFY_ZSET; break;
        case 'x': bit = NOTIFY_EXPIRED; break;
        case 'e': bit = NOTIFY_EVICTED; break;
        case 'K': bit = NOTIFY_KEYSPACE; break;
        case 'E': bit = NOTIFY_KEYEVENT; break;
        default: return -1;
        }
        flags |= bit;
    }
    return flags;
}

/* This function does exactly the revese of the function above: it gets
 * as input an integer with the xored flags and returns a string representing
 * the selected classes. The string returned is an sds string that needs to
 * be released with sdsfree(). */
/* Inverse of keyspaceEventsStringToFlags(): render the NOTIFY_* flags as a
 * string of class characters. When every class in NOTIFY_ALL is set a
 * single "A" is emitted instead of the individual letters; "K" and "E"
 * follow when set. The result is a new sds string the caller must release
 * with sdsfree(). */
sds keyspaceEventsFlagsToString(int flags) {
    static const struct {
        int flag;
        const char *letter;
    } classes[] = {
        { NOTIFY_GENERIC, "g" },
        { NOTIFY_STRING,  "$" },
        { NOTIFY_LIST,    "l" },
        { NOTIFY_SET,     "s" },
        { NOTIFY_HASH,    "h" },
        { NOTIFY_ZSET,    "z" },
        { NOTIFY_EXPIRED, "x" },
        { NOTIFY_EVICTED, "e" },
    };
    sds res = sdsempty();
    size_t i;

    if ((flags & NOTIFY_ALL) != NOTIFY_ALL) {
        for (i = 0; i < sizeof(classes)/sizeof(classes[0]); i++) {
            if (flags & classes[i].flag)
                res = sdscatlen(res,classes[i].letter,1);
        }
    } else {
        res = sdscatlen(res,"A",1);
    }

    if (flags & NOTIFY_KEYSPACE) res = sdscatlen(res,"K",1);
    if (flags & NOTIFY_KEYEVENT) res = sdscatlen(res,"E",1);
    return res;
}

/* The API provided to the rest of the Redis core is a simple function:
 *
 * notifyKeyspaceEvent(char *event, robj *key, int dbid);
 *
 * 'event' is a C string representing the event name.
 * 'key' is a Redis object representing the key name.
 * 'dbid' is the database ID where the key lives.  */
/* Publish keyspace notifications for an event.
 *
 * 'type' is the NOTIFY_* class of the event, 'event' the event name as a
 * C string, 'key' the key name object and 'dbid' the id of the DB holding
 * the key. Nothing is published when the class is not enabled in
 * server.notify_keyspace_events. Otherwise up to two messages are sent:
 *
 *   __keyspace@<db>__:<key>   with the event name as payload
 *   __keyevent@<db>__:<event> with the key name as payload */
void notifyKeyspaceEvent(int type, char *event, robj *key, int dbid) {
    char dbstr[24];
    int dblen = -1;
    robj *channel, *eventobj;
    sds name;

    /* Class disabled: return before allocating anything. */
    if (!(server.notify_keyspace_events & type)) return;

    eventobj = createStringObject(event,strlen(event));

    /* Both channel names embed the DB id; format it once if needed. */
    if (server.notify_keyspace_events & (NOTIFY_KEYSPACE|NOTIFY_KEYEVENT))
        dblen = ll2string(dbstr,sizeof(dbstr),dbid);

    if (server.notify_keyspace_events & NOTIFY_KEYSPACE) {
        name = sdsnewlen("__keyspace@",11);
        name = sdscatlen(name, dbstr, dblen);
        name = sdscatlen(name, "__:", 3);
        name = sdscatsds(name, key->ptr);
        channel = createObject(OBJ_STRING, name);
        pubsubPublishMessage(channel, eventobj);
        decrRefCount(channel);
    }

    if (server.notify_keyspace_events & NOTIFY_KEYEVENT) {
        name = sdsnewlen("__keyevent@",11);
        name = sdscatlen(name, dbstr, dblen);
        name = sdscatlen(name, "__:", 3);
        name = sdscatsds(name, eventobj->ptr);
        channel = createObject(OBJ_STRING, name);
        pubsubPublishMessage(channel, key);
        decrRefCount(channel);
    }

    decrRefCount(eventobj);
}


================================================
FILE: src/vr_notify.h
================================================
#ifndef _VR_NOTIFY_H_
#define _VR_NOTIFY_H_

/* Keyspace changes notification classes. Every class is associated with a
 * character for configuration purposes. */
#define NOTIFY_KEYSPACE (1<<0)    /* K */
#define NOTIFY_KEYEVENT (1<<1)    /* E */
#define NOTIFY_GENERIC (1<<2)     /* g */
#define NOTIFY_STRING (1<<3)      /* $ */
#define NOTIFY_LIST (1<<4)        /* l */
#define NOTIFY_SET (1<<5)         /* s */
#define NOTIFY_HASH (1<<6)        /* h */
#define NOTIFY_ZSET (1<<7)        /* z */
#define NOTIFY_EXPIRED (1<<8)     /* x */
#define NOTIFY_EVICTED (1<<9)     /* e */
#define NOTIFY_ALL (NOTIFY_GENERIC | NOTIFY_STRING | NOTIFY_LIST | NOTIFY_SET | NOTIFY_HASH | NOTIFY_ZSET | NOTIFY_EXPIRED | NOTIFY_EVICTED)      /* A */


#endif


================================================
FILE: src/vr_object.c
================================================
#include <math.h>
#include <ctype.h>

#include <vr_core.h>

#ifdef __CYGWIN__
#define strtold(a,b) ((long double)strtod((a),(b)))
#endif

/* Allocate a new object of the given type wrapping 'ptr'.
 *
 * The object starts with RAW encoding, constant == 0, lru == 0 and a
 * reference count of 1: the caller owns that single reference and drops it
 * with decrRefCount(). (A non-positive initial count would make the first
 * decrRefCount() panic, since it rejects refcount <= 0.) */
robj *createObject(int type, void *ptr) {
    robj *o = dalloc(sizeof(*o));
    o->type = type;
    o->encoding = OBJ_ENCODING_RAW;
    o->ptr = ptr;
    o->constant = 0;
    o->refcount = 1;
    o->lru = 0;
    return o;
}

/* Create a string object with encoding OBJ_ENCODING_RAW, that is a plain
 * string object where o->ptr points to a proper sds string. */
robj *createRawStringObject(const char *ptr, size_t len) {
    return createObject(OBJ_STRING,sdsnewlen(ptr,len));
}

/* Create a string object with encoding OBJ_ENCODING_EMBSTR, that is
 * an object where the sds string is actually an unmodifiable string
 * allocated in the same chunk as the object itself. */
/* Create a string object with encoding OBJ_ENCODING_EMBSTR: the object
 * header, an sdshdr8 header and the string bytes live in one allocation,
 * with o->ptr pointing just past the sds header.
 *
 * When 'ptr' is NULL the string content is zero-filled. The object starts
 * with a reference count of 1, owned by the caller. (A non-positive
 * initial count would make the first decrRefCount() panic, since it
 * rejects refcount <= 0.) */
robj *createEmbeddedStringObject(const char *ptr, size_t len) {
    robj *o = dalloc(sizeof(robj)+sizeof(struct sdshdr8)+len+1);
    struct sdshdr8 *sh = (void*)(o+1);

    o->type = OBJ_STRING;
    o->encoding = OBJ_ENCODING_EMBSTR;
    o->ptr = sh+1;
    o->constant = 0;
    o->refcount = 1;
    o->lru = 0;

    sh->len = len;
    sh->alloc = len;
    sh->flags = SDS_TYPE_8;
    if (ptr) {
        memcpy(sh->buf,ptr,len);
        sh->buf[len] = '\0';
    } else {
        /* No source buffer: produce len zero bytes plus the terminator. */
        memset(sh->buf,0,len+1);
    }
    return o;
}

/* Create a string object, picking the encoding from the length: strings of
 * at most OBJ_ENCODING_EMBSTR_SIZE_LIMIT bytes are stored EMBSTR-encoded,
 * longer ones RAW-encoded.
 *
 * NOTE(review): the limit is presumably chosen so that the largest EMBSTR
 * allocation still fits a 64 byte allocator size class - confirm against
 * sizeof(robj) in this tree. */
#define OBJ_ENCODING_EMBSTR_SIZE_LIMIT 44
robj *createStringObject(const char *ptr, size_t len) {
    if (len > OBJ_ENCODING_EMBSTR_SIZE_LIMIT)
        return createRawStringObject(ptr,len);

    return createEmbeddedStringObject(ptr,len);
}

/* Return a string object representing 'value'.
 *
 * Values in [0, OBJ_SHARED_INTEGERS) yield the matching entry of
 * shared.integers. Other values that fit a long become an INT-encoded
 * object storing the number in o->ptr; anything else is stored as an sds
 * string of its decimal representation. */
robj *createStringObjectFromLongLong(long long value) {
    robj *o;

    if (value >= 0 && value < OBJ_SHARED_INTEGERS)
        return shared.integers[value];

    if (value < LONG_MIN || value > LONG_MAX)
        return createObject(OBJ_STRING,sdsfromlonglong(value));

    o = createObject(OBJ_STRING, NULL);
    o->encoding = OBJ_ENCODING_INT;
    o->ptr = (void*)((long)value);
    return o;
}

/* Create a string object from a long double. If humanfriendly is non-zero
 * it does not use exponential format and trims trailing zeroes at the end,
 * however this results in loss of precision. Otherwise exp format is used
 * and the output of snprintf() is not modified.
 *
 * The 'humanfriendly' option is used for INCRBYFLOAT and HINCRBYFLOAT. */
/* Create a string object from a long double. If humanfriendly is non-zero
 * it does not use exponential format and trims trailing zeroes at the end,
 * however this results in loss of precision. Otherwise exp format is used
 * and the output of snprintf() is not modified.
 *
 * The buffer is sized for the longest "%.17Lf" rendering of a long double
 * (several thousand digits for the largest magnitudes). snprintf() returns
 * the length the full output would have had, so the result is additionally
 * clamped to what was actually stored before it is used as a length. */
robj *createStringObjectFromLongDouble(long double value, int humanfriendly) {
    char buf[5*1024];
    int len;

    buf[0] = '\0';
    if (isinf(value)) {
        /* Libc in odd systems (Hi Solaris!) will format infinite in a
         * different way, so better to handle it in an explicit way. */
        if (value > 0) {
            memcpy(buf,"inf",3);
            len = 3;
        } else {
            memcpy(buf,"-inf",4);
            len = 4;
        }
    } else if (humanfriendly) {
        /* We use 17 digits precision since with 128 bit floats that precision
         * after rounding is able to represent most small decimal numbers in a
         * way that is "non surprising" for the user (that is, most small
         * decimal numbers will be represented in a way that when converted
         * back into a string are exactly the same as what the user typed.) */
        len = snprintf(buf,sizeof(buf),"%.17Lf", value);
        if (len < 0) len = 0;
        else if ((size_t)len >= sizeof(buf)) len = (int)sizeof(buf)-1;

        /* Now remove trailing zeroes after the '.' */
        if (len > 0 && strchr(buf,'.') != NULL) {
            char *p = buf+len-1;
            while(*p == '0') {
                p--;
                len--;
            }
            if (*p == '.') len--;
        }
    } else {
        len = snprintf(buf,sizeof(buf),"%.17Lg", value);
        if (len < 0) len = 0;
        else if ((size_t)len >= sizeof(buf)) len = (int)sizeof(buf)-1;
    }
    return createStringObject(buf,len);
}

/* Duplicate a string object, with the guarantee that the returned object
 * has the same encoding as the original one.
 *
 * This function also guarantees that duplicating a small integere object
 * (or a string object that contains a representation of a small integer)
 * will always result in a fresh object that is unshared (refcount == 1).
 *
 * The resulting object always has refcount set to 1. */
/* Duplicate a string object, keeping the encoding of the original.
 *
 * RAW and EMBSTR strings get a copy of the sds content; INT-encoded
 * strings get a fresh object carrying the same integer in ptr, so the
 * result is never one of the shared objects. The object must be of type
 * OBJ_STRING. An unknown encoding triggers serverPanic(); NULL is returned
 * afterwards so the function never falls off its end without a value. */
robj *dupStringObject(robj *o) {
    robj *d;

    ASSERT(o->type == OBJ_STRING);

    switch(o->encoding) {
    case OBJ_ENCODING_RAW:
        return createRawStringObject(o->ptr,sdslen(o->ptr));
    case OBJ_ENCODING_EMBSTR:
        return createEmbeddedStringObject(o->ptr,sdslen(o->ptr));
    case OBJ_ENCODING_INT:
        d = createObject(OBJ_STRING, NULL);
        d->encoding = OBJ_ENCODING_INT;
        d->ptr = o->ptr;
        return d;
    default:
        serverPanic("Wrong encoding.");
        break;
    }

    /* Only reached if serverPanic() returns. */
    return NULL;
}

/* Return 'o' itself when it is flagged constant, otherwise a duplicate made
 * with dupStringObject(). */
robj *dupStringObjectUnconstant(robj *o) {
    return o->constant ? o : dupStringObject(o);
}

/* Create an empty list object backed by a new quicklist. */
robj *createQuicklistObject(void) {
    robj *o = createObject(OBJ_LIST,quicklistCreate());

    o->encoding = OBJ_ENCODING_QUICKLIST;
    return o;
}

/* Create an empty list object backed by a new ziplist. */
robj *createZiplistObject(void) {
    robj *o = createObject(OBJ_LIST,ziplistNew());

    o->encoding = OBJ_ENCODING_ZIPLIST;
    return o;
}

/* Create an empty set object backed by a hash table using setDictType. */
robj *createSetObject(void) {
    robj *o = createObject(OBJ_SET,dictCreate(&setDictType,NULL));

    o->encoding = OBJ_ENCODING_HT;
    return o;
}

/* Create an empty set object backed by a new intset. */
robj *createIntsetObject(void) {
    robj *o = createObject(OBJ_SET,intsetNew());

    o->encoding = OBJ_ENCODING_INTSET;
    return o;
}

/* Create an empty hash object; new hashes start out ziplist-encoded. */
robj *createHashObject(void) {
    robj *o = createObject(OBJ_HASH, ziplistNew());

    o->encoding = OBJ_ENCODING_ZIPLIST;
    return o;
}

/* The member object is stored in the zs->dict. 
  * You can use the member in the zs->zsl just 
  * when zs->dict was not released.
  */
/* Create an empty sorted set object with skiplist encoding: a zset holding
 * a dict (zsetDictType) and a skiplist. */
robj *createZsetObject(void) {
    zset *zs;
    robj *o;

    zs = dalloc(sizeof(*zs));
    zs->dict = dictCreate(&zsetDictType,NULL);
    zs->zsl = zslCreate();

    o = createObject(OBJ_ZSET,zs);
    o->encoding = OBJ_ENCODING_SKIPLIST;
    return o;
}

/* Create an empty sorted set object backed by a new ziplist. */
robj *createZsetZiplistObject(void) {
    robj *o = createObject(OBJ_ZSET,ziplistNew());

    o->encoding = OBJ_ENCODING_ZIPLIST;
    return o;
}

/* Release the payload of a string object. Only RAW strings own a separate
 * sds buffer; for every other encoding there is nothing to free here. */
void freeStringObject(robj *o) {
    if (o->encoding != OBJ_ENCODING_RAW) return;
    sdsfree(o->ptr);
}

/* Release the payload of a list object. Only the quicklist encoding is
 * handled; any other encoding panics. */
void freeListObject(robj *o) {
    if (o->encoding == OBJ_ENCODING_QUICKLIST) {
        quicklistRelease(o->ptr);
    } else {
        serverPanic("Unknown list encoding type");
    }
}

/* Release the payload of a set object: the dict for hash-table sets, the
 * single allocation for intsets. Panics on any other encoding. */
void freeSetObject(robj *o) {
    if (o->encoding == OBJ_ENCODING_HT) {
        dictRelease((dict*) o->ptr);
    } else if (o->encoding == OBJ_ENCODING_INTSET) {
        dfree(o->ptr);
    } else {
        serverPanic("Unknown set encoding type");
    }
}

/* Release the payload of a sorted set object.
 *
 * Skiplist encoding: release the dict, then the skiplist, then the zset
 * container. Ziplist encoding: a single allocation.
 * Panics on any other encoding. */
void freeZsetObject(robj *o) {
    if (o->encoding == OBJ_ENCODING_SKIPLIST) {
        zset *sorted = o->ptr;

        dictRelease(sorted->dict);
        zslFree(sorted->zsl);
        dfree(sorted);
    } else if (o->encoding == OBJ_ENCODING_ZIPLIST) {
        dfree(o->ptr);
    } else {
        serverPanic("Unknown sorted set encoding");
    }
}

/* Release the payload of a hash object: the dict for hash-table hashes,
 * the single allocation for ziplist hashes. Panics on any other encoding. */
void freeHashObject(robj *o) {
    if (o->encoding == OBJ_ENCODING_HT) {
        dictRelease((dict*) o->ptr);
    } else if (o->encoding == OBJ_ENCODING_ZIPLIST) {
        dfree(o->ptr);
    } else {
        serverPanic("Unknown hash encoding type");
    }
}

/* Take one more reference on 'o'. */
void incrRefCount(robj *o) {
    o->refcount += 1;
}

/* Drop one reference on 'o'. When the last reference goes away the
 * type-specific payload is released and then the object itself.
 * Panics if the count is already <= 0 or the type is unknown. */
void decrRefCount(robj *o) {
    if (o->refcount <= 0) serverPanic("decrRefCount against refcount <= 0");

    if (o->refcount != 1) {
        /* Other holders remain: just account for this release. */
        o->refcount--;
        return;
    }

    switch(o->type) {
    case OBJ_STRING:
        freeStringObject(o);
        break;
    case OBJ_LIST:
        freeListObject(o);
        break;
    case OBJ_SET:
        freeSetObject(o);
        break;
    case OBJ_ZSET:
        freeZsetObject(o);
        break;
    case OBJ_HASH:
        freeHashObject(o);
        break;
    default:
        serverPanic("Unknown object type");
        break;
    }
    dfree(o);
}

/* This variant of decrRefCount() gets its argument as void, and is useful
 * as free method in data structures that expect a 'void free_object(void*)'
 * prototype for the free method. */
void decrRefCountVoid(void *o) {
    decrRefCount(o);
}

/* Destroy 'o' regardless of its reference count: release the type-specific
 * payload and then the object itself. Objects flagged as constant are left
 * untouched. Panics on an unknown type. */
void freeObject(robj *o) {
    if (o->constant) return;

    if (o->type == OBJ_STRING) {
        freeStringObject(o);
    } else if (o->type == OBJ_LIST) {
        freeListObject(o);
    } else if (o->type == OBJ_SET) {
        freeSetObject(o);
    } else if (o->type == OBJ_ZSET) {
        freeZsetObject(o);
    } else if (o->type == OBJ_HASH) {
        freeHashObject(o);
    } else {
        serverPanic("Unknown object type");
    }
    dfree(o);
}

void freeObjectVoid(void *o) {
    freeObject(o);
}

/* Set the reference count of 'obj' to zero without freeing it, and return
 * the same object.
 *
 * This lets a freshly created object be passed straight to a function that
 * takes its own reference:
 *
 *    functionThatWillIncrementRefCount(resetRefCount(createObject(...)));
 *
 * instead of the longer form:
 *
 *    obj = createObject(...);
 *    functionThatWillIncrementRefCount(obj);
 *    decrRefCount(obj);
 */
robj *resetRefCount(robj *obj) {
    obj->refcount = 0;

    return obj;
}

/* Verify that 'o' has the expected type.
 *
 * Returns 0 when the type matches. Otherwise queues the shared wrong-type
 * error reply on client 'c' and returns 1. */
int checkType(client *c, robj *o, int type) {
    if (o->type == type) return 0;

    addReply(c,shared.wrongtypeerr);
    return 1;
}

/* Check whether string object 'o' holds an integer.
 *
 * Returns VR_OK and stores the value in *llval (when llval is not NULL for
 * the INT-encoded case) if it does, VR_ERROR otherwise. */
int isObjectRepresentableAsLongLong(robj *o, long long *llval) {
    serverAssertWithInfo(NULL,o,o->type == OBJ_STRING);

    if (o->encoding != OBJ_ENCODING_INT) {
        /* Textual payload: let string2ll() decide. */
        return string2ll(o->ptr,sdslen(o->ptr),llval) ? VR_OK : VR_ERROR;
    }

    /* Integer encoding: the value lives in the pointer field itself. */
    if (llval) *llval = (long) o->ptr;
    return VR_OK;
}

/* Try to re-encode a string object into a more compact representation.
 *
 * The returned object replaces 'o': it is either 'o' itself (possibly
 * modified in place), a shared integer object, or a new EMBSTR object. In
 * the last two cases 'o' has been destroyed with freeObject().
 *
 * Objects that are not RAW/EMBSTR encoded, and objects flagged as constant,
 * are returned unchanged. */
robj *tryObjectEncoding(robj *o) {
    sds str = o->ptr;
    size_t slen;
    long num;

    /* Only string objects are handled here; other types manage their own
     * compact encodings in the commands implementing them. */
    serverAssertWithInfo(NULL,o,o->type == OBJ_STRING);

    /* Nothing to do unless the payload is an actual array of chars, and
     * constant objects are never re-encoded. */
    if (!sdsEncodedObject(o) || o->constant) return o;

    /* Integer candidates. Anything longer than 21 chars cannot be a 32 or
     * 64 bit integer, so the parse is skipped for those. */
    slen = sdslen(str);
    if (slen <= 21 && string2l(str,slen,&num)) {
        /* Small non-negative values come from the shared integer table.
         * Upstream also gated this on the maxmemory/LRU policy; that test
         * is dropped here because LRU is not supported. */
        if (num >= 0 && num < OBJ_SHARED_INTEGERS) {
            freeObject(o);
            return shared.integers[num];
        }

        /* Otherwise keep the object and store the value in its pointer. */
        if (o->encoding == OBJ_ENCODING_RAW) sdsfree(o->ptr);
        o->encoding = OBJ_ENCODING_INT;
        o->ptr = (void*) num;
        return o;
    }

    /* Short strings: switch to EMBSTR, where the object header and the sds
     * string share one allocation. */
    if (slen <= OBJ_ENCODING_EMBSTR_SIZE_LIMIT) {
        robj *embedded;

        if (o->encoding == OBJ_ENCODING_EMBSTR) return o;
        embedded = createEmbeddedStringObject(str,sdslen(str));
        freeObject(o);
        return embedded;
    }

    /* Long strings cannot be re-encoded. As a last resort trim the sds
     * buffer when more than 10% of the string length is unused space. */
    if (o->encoding == OBJ_ENCODING_RAW && sdsavail(str) > slen/10) {
        o->ptr = sdsRemoveFreeSpace(o->ptr);
    }

    return o;
}

/* Get a string-encoded view of a string object.
 *
 * If 'o' is already RAW/EMBSTR encoded, 'o' itself is returned; its
 * reference count is NOT modified. If 'o' is INT encoded, a new string
 * object holding the decimal text of the integer is created and returned.
 *
 * Callers that need to release the result must therefore compare it with
 * the argument: only a result different from 'o' is a new object.
 *
 * Any other object panics. */
robj *getDecodedObject(robj *o) {
    if (sdsEncodedObject(o)) {
        return o;
    }
    if (o->type == OBJ_STRING && o->encoding == OBJ_ENCODING_INT) {
        char buf[32];
        size_t len;

        /* ll2string() returns the number of characters written, so the
         * text does not need to be measured a second time. */
        len = ll2string(buf,sizeof(buf),(long)o->ptr);
        return createStringObject(buf,len);
    }

    serverPanic("Unknown encoding type");
    /* Only reachable if serverPanic() returns. */
    return NULL;
}

/* Compare two string objects, either byte-wise or with strcoll(),
 * depending on 'flags'.
 *
 * Integer-encoded operands are rendered with ll2string() into stack
 * buffers rather than being decoded into new objects.
 *
 * With REDIS_COMPARE_COLL set, strcoll() is used. Otherwise the comparison
 * is binary safe: memcmp() over the common prefix, then the difference of
 * the lengths when the prefixes are equal.
 *
 * Returns 0 when equal, a negative or positive value otherwise. */

#define REDIS_COMPARE_BINARY (1<<0)
#define REDIS_COMPARE_COLL (1<<1)

int compareStringObjectsWithFlags(robj *a, robj *b, int flags) {
    serverAssertWithInfo(NULL,a,a->type == OBJ_STRING && b->type == OBJ_STRING);
    char lbuf[128], rbuf[128];
    char *lhs, *rhs;
    size_t llen, rlen, shortest;
    int cmp;

    /* Same object: equal by definition. */
    if (a == b) return 0;

    if (!sdsEncodedObject(a)) {
        llen = ll2string(lbuf,sizeof(lbuf),(long) a->ptr);
        lhs = lbuf;
    } else {
        lhs = a->ptr;
        llen = sdslen(lhs);
    }

    if (!sdsEncodedObject(b)) {
        rlen = ll2string(rbuf,sizeof(rbuf),(long) b->ptr);
        rhs = rbuf;
    } else {
        rhs = b->ptr;
        rlen = sdslen(rhs);
    }

    if (flags & REDIS_COMPARE_COLL) return strcoll(lhs,rhs);

    shortest = (llen < rlen) ? llen : rlen;
    cmp = memcmp(lhs,rhs,shortest);
    if (cmp != 0) return cmp;
    return llen-rlen;
}

/* Binary-safe comparison of two string objects. */
int compareStringObjects(robj *a, robj *b) {
    int order = compareStringObjectsWithFlags(a,b,REDIS_COMPARE_BINARY);

    return order;
}

/* Collation-based (strcoll) comparison of two string objects. */
int collateStringObjects(robj *a, robj *b) {
    int order = compareStringObjectsWithFlags(a,b,REDIS_COMPARE_COLL);

    return order;
}

/* Return 1 if the two string objects compare equal as strings, 0 otherwise.
 *
 * This is faster than testing compareStringObjects(a,b) == 0 because two
 * integer-encoded objects can be compared by their stored value alone. */
int equalStringObjects(robj *a, robj *b) {
    int both_int = (a->encoding == OBJ_ENCODING_INT &&
                    b->encoding == OBJ_ENCODING_INT);

    if (!both_int) return compareStringObjects(a,b) == 0;

    /* Both hold their integer in the pointer field: compare it directly. */
    return a->ptr == b->ptr;
}

/* Length of the string representation of 'o': the sds length for RAW/EMBSTR
 * objects, the number of characters of the integer otherwise. */
size_t stringObjectLen(robj *o) {
    serverAssertWithInfo(NULL,o,o->type == OBJ_STRING);

    if (!sdsEncodedObject(o)) {
        return sdigits10((long)o->ptr);
    }
    return sdslen(o->ptr);
}

/* Convert string object 'o' to a double.
 *
 * A NULL object converts to 0. A RAW/EMBSTR payload is parsed with strtod()
 * and rejected when it starts with whitespace, has trailing characters,
 * overflows or underflows (ERANGE), is reported invalid (EINVAL), or is
 * NaN. An INT-encoded payload is converted directly.
 *
 * Returns VR_OK and stores the result in *target, or VR_ERROR leaving
 * *target untouched. */
int getDoubleFromObject(robj *o, double *target) {
    double value;
    char *eptr;

    if (o == NULL) {
        value = 0;
    } else {
        serverAssertWithInfo(NULL,o,o->type == OBJ_STRING);
        if (sdsEncodedObject(o)) {
            errno = 0;
            value = strtod(o->ptr, &eptr);
            /* The <ctype.h> functions need a value representable as
             * unsigned char: convert first so bytes >= 0x80 are not passed
             * as negative ints. */
            if (isspace((unsigned char)((char*)o->ptr)[0]) ||
                eptr[0] != '\0' ||
                (errno == ERANGE &&
                    (value == HUGE_VAL || value == -HUGE_VAL || value == 0)) ||
                errno == EINVAL ||
                isnan(value))
                return VR_ERROR;
        } else if (o->encoding == OBJ_ENCODING_INT) {
            value = (long)o->ptr;
        } else {
            serverPanic("Unknown string encoding");
            /* Only reachable if serverPanic() returns: never fall through
             * with 'value' uninitialized. */
            return VR_ERROR;
        }
    }
    *target = value;
    return VR_OK;
}

/* getDoubleFromObject() plus error reporting: on failure an error reply is
 * queued on 'c' ('msg' if given, a default message otherwise) and VR_ERROR
 * is returned. On success *target is set and VR_OK is returned. */
int getDoubleFromObjectOrReply(client *c, robj *o, double *target, const char *msg) {
    double parsed;

    if (getDoubleFromObject(o, &parsed) == VR_OK) {
        *target = parsed;
        return VR_OK;
    }

    addReplyError(c, msg != NULL ? (char*)msg : "value is not a valid float");
    return VR_ERROR;
}

/* Convert string object 'o' to a long double.
 *
 * A NULL object converts to 0. A RAW/EMBSTR payload is parsed with
 * strtold() and rejected when it starts with whitespace, has trailing
 * characters, is out of range (ERANGE) or is NaN. An INT-encoded payload is
 * converted directly.
 *
 * Returns VR_OK and stores the result in *target, or VR_ERROR leaving
 * *target untouched. */
int getLongDoubleFromObject(robj *o, long double *target) {
    long double value;
    char *eptr;

    if (o == NULL) {
        value = 0;
    } else {
        serverAssertWithInfo(NULL,o,o->type == OBJ_STRING);
        if (sdsEncodedObject(o)) {
            errno = 0;
            value = strtold(o->ptr, &eptr);
            /* isspace() needs an unsigned char value: convert first so
             * bytes >= 0x80 are not passed as negative ints. */
            if (isspace((unsigned char)((char*)o->ptr)[0]) ||
                eptr[0] != '\0' ||
                errno == ERANGE || isnan(value))
                return VR_ERROR;
        } else if (o->encoding == OBJ_ENCODING_INT) {
            value = (long)o->ptr;
        } else {
            serverPanic("Unknown string encoding");
            /* Only reachable if serverPanic() returns: never fall through
             * with 'value' uninitialized. */
            return VR_ERROR;
        }
    }
    *target = value;
    return VR_OK;
}

/* getLongDoubleFromObject() plus error reporting: on failure an error reply
 * is queued on 'c' ('msg' if given, a default message otherwise) and
 * VR_ERROR is returned. On success *target is set and VR_OK is returned. */
int getLongDoubleFromObjectOrReply(client *c, robj *o, long double *target, const char *msg) {
    long double parsed;

    if (getLongDoubleFromObject(o, &parsed) == VR_OK) {
        *target = parsed;
        return VR_OK;
    }

    addReplyError(c, msg != NULL ? (char*)msg : "value is not a valid float");
    return VR_ERROR;
}

/* Convert string object 'o' to a long long.
 *
 * A NULL object converts to 0. A RAW/EMBSTR payload is parsed with
 * strtoll() in base 10 and rejected when it starts with whitespace, has
 * trailing characters or is out of range (ERANGE). An INT-encoded payload
 * is converted directly.
 *
 * Returns VR_OK and, when 'target' is not NULL, stores the result in
 * *target. Returns VR_ERROR otherwise. */
int getLongLongFromObject(robj *o, long long *target) {
    long long value;
    char *eptr;

    if (o == NULL) {
        value = 0;
    } else {
        serverAssertWithInfo(NULL,o,o->type == OBJ_STRING);
        if (sdsEncodedObject(o)) {
            errno = 0;
            value = strtoll(o->ptr, &eptr, 10);
            /* isspace() needs an unsigned char value: convert first so
             * bytes >= 0x80 are not passed as negative ints. */
            if (isspace((unsigned char)((char*)o->ptr)[0]) ||
                eptr[0] != '\0' ||
                errno == ERANGE)
                return VR_ERROR;
        } else if (o->encoding == OBJ_ENCODING_INT) {
            value = (long)o->ptr;
        } else {
            serverPanic("Unknown string encoding");
            /* Only reachable if serverPanic() returns: never fall through
             * with 'value' uninitialized. */
            return VR_ERROR;
        }
    }
    if (target) *target = value;
    return VR_OK;
}

/* getLongLongFromObject() plus error reporting: on failure an error reply
 * is queued on 'c' ('msg' if given, a default message otherwise) and
 * VR_ERROR is returned. On success *target is set and VR_OK is returned. */
int getLongLongFromObjectOrReply(client *c, robj *o, long long *target, const char *msg) {
    long long parsed;

    if (getLongLongFromObject(o, &parsed) == VR_OK) {
        *target = parsed;
        return VR_OK;
    }

    addReplyError(c, msg != NULL ? (char*)msg
                                 : "value is not an integer or out of range");
    return VR_ERROR;
}

/* Convert 'o' to a long, replying with an error on failure.
 *
 * The value is first parsed as a long long (any error reply for that step
 * is produced by getLongLongFromObjectOrReply()), then checked against the
 * range of long. Returns VR_OK with *target set, or VR_ERROR after an error
 * reply has been queued on 'c'. */
int getLongFromObjectOrReply(client *c, robj *o, long *target, const char *msg) {
    long long wide;

    if (getLongLongFromObjectOrReply(c, o, &wide, msg) != VR_OK) return VR_ERROR;

    if (wide >= LONG_MIN && wide <= LONG_MAX) {
        *target = wide;
        return VR_OK;
    }

    addReplyError(c, msg != NULL ? (char*)msg : "value is out of range");
    return VR_ERROR;
}

char *strEncoding(int encoding) {
    switch(encoding) {
    case OBJ_ENCODING_RAW: return "raw";
    case OBJ_ENCODING_INT: return "int";
    case OBJ_ENCODING_HT: return "hashtable";
    case OBJ_ENCODING_QUICKLIST: return "quicklist";
    case OBJ_ENCODING_ZIPLIST: return "ziplist";
    case OBJ_ENCODING_INTSET: return "intset";
    case OBJ_ENCODING_SKIPLIST: return "skiplist";
    case OBJ_ENCODING_EMBSTR: return "embstr";
    default: return "unknown";
    }
}

/* Estimate for how many milliseconds, at least, the object has not been
 * requested, based on the approximated LRU clock.
 *
 * When the current clock is behind the object's stamp the clock is assumed
 * to have wrapped around once. */
unsigned long long estimateObjectIdleTime(robj *o) {
    unsigned long long now = LRU_CLOCK();
    unsigned long long ticks;

    if (now < o->lru) {
        ticks = now + (LRU_CLOCK_MAX - o->lru);
    } else {
        ticks = now - o->lru;
    }
    return ticks * LRU_CLOCK_RESOLUTION;
}

/* Memory used by the sds string of a string object.
 *
 * RAW: the allocation size of the sds buffer. EMBSTR: the size of the
 * object's allocation minus the robj header. Anything else (integer
 * encoding for now): 0. */
size_t getStringObjectSdsUsedMemory(robj *o) {
    serverAssertWithInfo(NULL,o,o->type == OBJ_STRING);

    if (o->encoding == OBJ_ENCODING_RAW) {
        return sdsZmallocSize(o->ptr);
    }
    if (o->encoding == OBJ_ENCODING_EMBSTR) {
        return dmalloc_size(o)-sizeof(robj);
    }
    return 0;
}

/* Lookup helper for the OBJECT command: find 'key' directly in the dict of
 * the client's current db, so that the lookup does not modify the LRU or
 * other parameters. Returns the stored value, or NULL if the key is absent. */
robj *objectCommandLookup(client *c, robj *key) {
    dictEntry *entry = dictFind(c->db->dict,key->ptr);

    if (entry == NULL) return NULL;
    return (robj*) dictGetVal(entry);
}

/* objectCommandLookup() that also queues 'reply' on the client when the key
 * does not exist. Returns the value, or NULL after replying. */
robj *objectCommandLookupOrReply(client *c, robj *key, robj *reply) {
    robj *found = objectCommandLookup(c,key);

    if (found == NULL) addReply(c, reply);
    return found;
}

/* OBJECT command: inspect the internals of a stored object.
 * Usage: OBJECT <encoding|idletime> <key>
 *
 * Both subcommands resolve the db for the key, take the db read lock, look
 * the key up without touching it, and reply with either the encoding name
 * or the estimated idle time in seconds. A missing key gets a null bulk
 * reply; anything else is a syntax error. */
void objectCommand(client *c) {
    int want_encoding, want_idletime;
    robj *val;

    want_encoding = !strcasecmp(c->argv[1]->ptr,"encoding") && c->argc == 3;
    want_idletime = !want_encoding &&
                    !strcasecmp(c->argv[1]->ptr,"idletime") && c->argc == 3;

    if (!want_encoding && !want_idletime) {
        addReplyError(c,"Syntax error. Try OBJECT (encoding|idletime)");
        return;
    }

    fetchInternalDbByKey(c,c->argv[2]);
    lockDbRead(c->db);
    val = objectCommandLookupOrReply(c,c->argv[2],shared.nullbulk);
    if (val != NULL) {
        if (want_encoding) {
            addReplyBulkCString(c,strEncoding(val->encoding));
        } else {
            /* estimateObjectIdleTime() is in milliseconds. */
            addReplyLongLong(c,estimateObjectIdleTime(val)/1000);
        }
    }
    unlockDb(c->db);
}


================================================
FILE: src/vr_object.h
================================================
#ifndef _VR_OBJECT_H_
#define _VR_OBJECT_H_

/* Exclusive upper bound of the values served from shared.integers[]:
 * tryObjectEncoding() returns shared.integers[v] for 0 <= v < this. */
#define OBJ_SHARED_INTEGERS 10000
/* NOTE(review): presumably the number of precomputed shared bulk/multi-bulk
 * headers; not used in this part of the code, confirm at the definition of
 * 'shared'. */
#define OBJ_SHARED_BULKHDR_LEN 32

/* Object types, stored in the 4-bit 'type' field of robj. */
#define OBJ_STRING 0
#define OBJ_LIST 1
#define OBJ_SET 2
#define OBJ_ZSET 3
#define OBJ_HASH 4

/* Object encodings. Some kinds of objects, like Strings and Hashes, can be
 * internally represented in multiple ways. The 'encoding' field of the
 * object is set to one of these values. */
#define OBJ_ENCODING_RAW 0     /* Raw representation */
#define OBJ_ENCODING_INT 1     /* Encoded as integer */
#define OBJ_ENCODING_HT 2      /* Encoded as hash table */
#define OBJ_ENCODING_ZIPMAP 3  /* Encoded as zipmap */
#define OBJ_ENCODING_LINKEDLIST 4 /* Encoded as regular linked list */
#define OBJ_ENCODING_ZIPLIST 5 /* Encoded as ziplist */
#define OBJ_ENCODING_INTSET 6  /* Encoded as intset */
#define OBJ_ENCODING_SKIPLIST 7  /* Encoded as skiplist */
#define OBJ_ENCODING_EMBSTR 8  /* Embedded sds string encoding */
#define OBJ_ENCODING_QUICKLIST 9 /* Encoded as linked list of ziplists */

/* NOTE(review): presumably selectors for the key or value side of a hash
 * entry; not used in this part of the code, confirm at the call sites. */
#define OBJ_HASH_KEY 1
#define OBJ_HASH_VALUE 2

/* True when the object's payload is an sds string (RAW or EMBSTR encoding).
 * The argument is parenthesized so any pointer expression can be passed
 * (e.g. 'objs + i'); note that it is evaluated twice. */
#define sdsEncodedObject(objptr) ((objptr)->encoding == OBJ_ENCODING_RAW || (objptr)->encoding == OBJ_ENCODING_EMBSTR)

/* The actual Redis Object */
#define LRU_BITS 24 /* Width of the 'lru' bit-field below */
#define LRU_CLOCK_MAX ((1<<LRU_BITS)-1) /* Max value of obj->lru */
#define LRU_CLOCK_RESOLUTION 1000 /* LRU clock resolution in ms */
typedef struct vr_object {
    unsigned type:4;        /* One of the OBJ_* object types */
    unsigned encoding:4;    /* One of the OBJ_ENCODING_* values */
    unsigned lru:LRU_BITS; /* lru time (relative to server.lruclock) */
    unsigned constant:1;    /* When set, freeObject() leaves the object alone
                             * and tryObjectEncoding() does not re-encode it */
    int refcount;           /* Updated by incrRefCount()/decrRefCount() */
    void *ptr;              /* Payload; with OBJ_ENCODING_INT the integer is
                             * stored in the pointer value itself */
} robj;

/* Reference counting and destruction. */
void decrRefCount(robj *o);
void decrRefCountVoid(void *o);
void incrRefCount(robj *o);
robj *resetRefCount(robj *obj);
void freeObject(robj *o);
void freeObjectVoid(void *o);
/* Type-specific payload release; these do not free the robj itself. */
void freeStringObject(robj *o);
void freeListObject(robj *o);
void freeSetObject(robj *o);
void freeZsetObject(robj *o);
void freeHashObject(robj *o);
/* String object construction, duplication and (re)encoding. */
robj *createObject(int type, void *ptr);
robj *createStringObject(const char *ptr, size_t len);
robj *createRawStringObject(const char *ptr, size_t len);
robj *createEmbeddedStringObject(const char *ptr, size_t len);
robj *dupStringObject(robj *o);
robj *dupStringObjectUnconstant(robj *o);
int isObjectRepresentableAsLongLong(robj *o, long long *llongval);
robj *tryObjectEncoding(robj *o);
robj *getDecodedObject(robj *o);
size_t stringObjectLen(robj *o);
robj *createStringObjectFromLongLong(long long value);
robj *createStringObjectFromLongDouble(long double value, int humanfriendly);
/* Empty container objects, one constructor per type/encoding pair. */
robj *createQuicklistObject(void);
robj *createZiplistObject(void);
robj *createSetObject(void);
robj *createIntsetObject(void);
robj *createHashObject(void);
robj *createZsetObject(void);
robj *createZsetZiplistObject(void);
/* Type checking and numeric conversion. The *OrReply variants queue an
 * error reply on the client when they fail. */
int getLongFromObjectOrReply(struct client *c, robj *o, long *target, const char *msg);
int checkType(struct client *c, robj *o, int type);
int getLongLongFromObjectOrReply(struct client *c, robj *o, long long *target, const char *msg);
int getDoubleFromObjectOrReply(struct client *c, robj *o, double *target, const char *msg);
int getLongLongFromObject(robj *o, long long *target);
int getLongDoubleFromObject(robj *o, long double *target);
int getLongDoubleFromObjectOrReply(struct client *c, robj *o, long double *target, const char *msg);
/* Introspection and comparison. */
char *strEncoding(int encoding);
int compareStringObjects(robj *a, robj *b);
int collateStringObjects(robj *a, robj *b);
int equalStringObjects(robj *a, robj *b);
unsigned long long estimateObjectIdleTime(robj *o);

size_t getStringObjectSdsUsedMemory(robj *o);

/* OBJECT command and its lookup helpers. */
robj *objectCommandLookup(struct client *c, robj *key);
robj *objectCommandLookupOrReply(struct client *c, robj *key, robj *reply);
void objectCommand(struct client *c);

#endif


================================================
FILE: src/vr_pubsub.c
================================================
#include <vr_core.h>

/* Unsubscribe a client from a channel. Returns 1 if the operation
 * succeeded, or 0 if the client was not subscribed to the channel.
 * When 'notify' is non-zero an "unsubscribe" reply is sent either way. */
int pubsubUnsubscribeChannel(client *c, robj *channel, int notify) {
    int removed = 0;

    /* 'channel' may be the very object stored in the hash tables we are
     * about to delete from: hold a reference until we are done with it. */
    incrRefCount(channel);

    /* client -> channels table first ... */
    if (dictDelete(c->pubsub_channels,channel) == DICT_OK) {
        dictEntry *de;
        dlistNode *ln;
        dlist *subscribers;

        removed = 1;

        /* ... then the channel -> clients list table. */
        de = dictFind(c->vel->pubsub_channels,channel);
        serverAssertWithInfo(c,NULL,de != NULL);
        subscribers = dictGetVal(de);
        ln = dlistSearchKey(subscribers,c);
        serverAssertWithInfo(c,NULL,ln != NULL);
        dlistDelNode(subscribers,ln);

        /* Last subscriber gone: drop the list and its hash entry, so that
         * it is not possible to abuse PUBSUB by creating millions of
         * channels. */
        if (dlistLength(subscribers) == 0) {
            dictDelete(c->vel->pubsub_channels,channel);
        }
    }

    if (notify) {
        addReply(c,shared.mbulkhdr[3]);
        addReply(c,shared.unsubscribebulk);
        addReplyBulk(c,channel);
        addReplyLongLong(c,dictSize(c->pubsub_channels)+
                       dlistLength(c->pubsub_patterns));
    }

    /* It is finally safe to release our protective reference. */
    decrRefCount(channel);
    return removed;
}

/* Unsubscribe the client from every channel it is subscribed to. Returns
 * the number of channels it was subscribed to. With 'notify' set, a reply
 * is sent even when there was nothing to unsubscribe from. */
int pubsubUnsubscribeAllChannels(client *c, int notify) {
    dictIterator *iter = dictGetSafeIterator(c->pubsub_channels);
    dictEntry *entry;
    int total = 0;

    for (entry = dictNext(iter); entry != NULL; entry = dictNext(iter)) {
        robj *channel = dictGetKey(entry);

        total += pubsubUnsubscribeChannel(c,channel,notify);
    }

    if (notify && total == 0) {
        /* Subscribed to nothing: the client still expects an answer. */
        addReply(c,shared.mbulkhdr[3]);
        addReply(c,shared.unsubscribebulk);
        addReply(c,shared.nullbulk);
        addReplyLongLong(c,dictSize(c->pubsub_channels)+
                       dlistLength(c->pubsub_patterns));
    }
    dictReleaseIterator(iter);
    return total;
}

/* Unsubscribe a client from a pattern. Returns 1 if the operation
 * succeeded, or 0 if the client was not subscribed to the pattern.
 * When 'notify' is non-zero a "punsubscribe" reply is sent either way. */
int pubsubUnsubscribePattern(client *c, robj *pattern, int notify) {
    dlistNode *node;
    int removed = 0;

    /* 'pattern' may be the same object we are about to remove: protect it. */
    incrRefCount(pattern);

    node = dlistSearchKey(c->pubsub_patterns,pattern);
    if (node != NULL) {
        pubsubPattern key;

        removed = 1;
        dlistDelNode(c->pubsub_patterns,node);

        /* Remove the matching (client, pattern) pair from the list shared
         * through c->vel as well. */
        key.client = c;
        key.pattern = pattern;
        node = dlistSearchKey(c->vel->pubsub_patterns,&key);
        dlistDelNode(c->vel->pubsub_patterns,node);
    }

    if (notify) {
        addReply(c,shared.mbulkhdr[3]);
        addReply(c,shared.punsubscribebulk);
        addReplyBulk(c,pattern);
        addReplyLongLong(c,dictSize(c->pubsub_channels)+
                       dlistLength(c->pubsub_patterns));
    }

    decrRefCount(pattern);
    return removed;
}

/* Unsubscribe the client from every pattern it is subscribed to. Returns
 * the number of patterns it was subscribed to. With 'notify' set, a reply
 * is sent even when there was nothing to unsubscribe from. */
int pubsubUnsubscribeAllPatterns(client *c, int notify) {
    dlistIter iter;
    dlistNode *node;
    int total = 0;

    dlistRewind(c->pubsub_patterns,&iter);
    for (node = dlistNext(&iter); node != NULL; node = dlistNext(&iter)) {
        robj *pattern = node->value;

        total += pubsubUnsubscribePattern(c,pattern,notify);
    }

    if (notify && total == 0) {
        /* Subscribed to nothing: the client still expects an answer. */
        addReply(c,shared.mbulkhdr[3]);
        addReply(c,shared.punsubscribebulk);
        addReply(c,shared.nullbulk);
        addReplyLongLong(c,dictSize(c->pubsub_channels)+
                       dlistLength(c->pubsub_patterns));
    }
    return total;
}

/*-----------------------------------------------------------------------------
 * Pubsub commands implementation
 *----------------------------------------------------------------------------*/


/* Subscribe a client to a channel. Returns 1 if the operation succeeded, or
 * 0 if the client was already subscribed to that channel. A "subscribe"
 * reply is sent in both cases. */
int pubsubSubscribeChannel(client *c, robj *channel) {
    int added = 0;

    /* client -> channels table; fails if already subscribed. */
    if (dictAdd(c->pubsub_channels,channel,NULL) == DICT_OK) {
        dictEntry *entry;
        dlist *subscribers;

        added = 1;
        incrRefCount(channel);

        /* channel -> list of clients table, created on first use. */
        entry = dictFind(c->vel->pubsub_channels,channel);
        if (entry != NULL) {
            subscribers = dictGetVal(entry);
        } else {
            subscribers = dlistCreate();
            dictAdd(c->vel->pubsub_channels,channel,subscribers);
            incrRefCount(channel);
        }
        dlistAddNodeTail(subscribers,c);
    }

    /* Notify the client */
    addReply(c,shared.mbulkhdr[3]);
    addReply(c,shared.subscribebulk);
    addReplyBulk(c,channel);
    addReplyLongLong(c,clientSubscriptionsCount(c));
    return added;
}

/* SUBSCRIBE: subscribe the client to every channel given as argument and
 * flag it as a pubsub client. */
void subscribeCommand(client *c) {
    int idx = 1;

    while (idx < c->argc) {
        pubsubSubscribeChannel(c,c->argv[idx]);
        idx++;
    }
    c->flags |= CLIENT_PUBSUB;
}

/* Total number of subscriptions of a client: channels plus patterns. */
int clientSubscriptionsCount(client *c) {
    return dictSize(c->pubsub_channels) + dlistLength(c->pubsub_patterns);
}

/* UNSUBSCRIBE: with no arguments leave every channel, otherwise leave the
 * listed ones. The pubsub flag is cleared once no subscription is left. */
void unsubscribeCommand(client *c) {
    int idx;

    if (c->argc != 1) {
        for (idx = 1; idx < c->argc; idx++) {
            pubsubUnsubscribeChannel(c,c->argv[idx],1);
        }
    } else {
        pubsubUnsubscribeAllChannels(c,1);
    }

    if (clientSubscriptionsCount(c) == 0) c->flags &= ~CLIENT_PUBSUB;
}

/* Subscribe a client to a pattern. Returns 1 if the operation succeeded, or
 * 0 if the client was already subscribed to that pattern. A "psubscribe"
 * reply is sent in both cases.
 *
 * NOTE(review): getDecodedObject() hands back 'pattern' itself, without an
 * extra reference, when it is already sds-encoded; confirm that whatever
 * releases pat->pattern accounts for that. */
int pubsubSubscribePattern(client *c, robj *pattern) {
    int added = 0;

    if (dlistSearchKey(c->pubsub_patterns,pattern) == NULL) {
        pubsubPattern *pat;

        added = 1;

        /* Per-client list of patterns. */
        dlistAddNodeTail(c->pubsub_patterns,pattern);
        incrRefCount(pattern);

        /* (client, pattern) pair in the list shared through c->vel. */
        pat = dalloc(sizeof(*pat));
        pat->pattern = getDecodedObject(pattern);
        pat->client = c;
        dlistAddNodeTail(c->vel->pubsub_patterns,pat);
    }

    /* Notify the client */
    addReply(c,shared.mbulkhdr[3]);
    addReply(c,shared.psubscribebulk);
    addReplyBulk(c,pattern);
    addReplyLongLong(c,clientSubscriptionsCount(c));
    return added;
}

/* PSUBSCRIBE: subscribe the client to every pattern given as argument and
 * flag it as a pubsub client. */
void psubscribeCommand(client *c) {
    int idx = 1;

    while (idx < c->argc) {
        pubsubSubscribePattern(c,c->argv[idx]);
        idx++;
    }
    c->flags |= CLIENT_PUBSUB;
}

/* PUNSUBSCRIBE: with no arguments leave every pattern, otherwise leave the
 * listed ones. The pubsub flag is cleared once no subscription is left. */
void punsubscribeCommand(client *c) {
    int idx;

    if (c->argc != 1) {
        for (idx = 1; idx < c->argc; idx++) {
            pubsubUnsubscribePattern(c,c->argv[idx],1);
        }
    } else {
        pubsubUnsubscribeAllPatterns(c,1);
    }

    if (clientSubscriptionsCount(c) == 0) c->flags &= ~CLIENT_PUBSUB;
}

/* Publish 'message' on 'channel'.
 *
 * The message is delivered first to the clients subscribed to the exact
 * channel (3-element "message" reply), then to the clients whose pattern
 * matches the channel name (4-element "pmessage" reply).
 *
 * Returns the number of deliveries performed.
 *
 * NOTE(review): this function reads server.pubsub_channels and
 * server.pubsub_patterns while the subscribe/unsubscribe functions in this
 * file go through c->vel; confirm both refer to the same tables. */
int pubsubPublishMessage(robj *channel, robj *message) {
    int receivers = 0;
    dictEntry *de;
    dlistNode *ln;
    dlistIter li;

    /* Send to clients listening for that channel */
    de = dictFind(server.pubsub_channels,channel);
    if (de) {
        dlist *list = dictGetVal(de);

        dlistRewind(list,&li);
        while ((ln = dlistNext(&li)) != NULL) {
            client *c = ln->value;

            addReply(c,shared.mbulkhdr[3]);
            addReply(c,shared.messagebulk);
            addReplyBulk(c,channel);
            addReplyBulk(c,message);
            receivers++;
        }
    }
    /* Send to clients listening to matching channels */
    if (dlistLength(server.pubsub_patterns)) {
        /* Pattern matching needs the channel name as an sds string. */
        robj *decoded = getDecodedObject(channel);

        dlistRewind(server.pubsub_patterns,&li);
        while ((ln = dlistNext(&li)) != NULL) {
            pubsubPattern *pat = ln->value;

            if (stringmatchlen((char*)pat->pattern->ptr,
                                sdslen(pat->pattern->ptr),
                                (char*)decoded->ptr,
                                sdslen(decoded->ptr),0)) {
                addReply(pat->client,shared.mbulkhdr[4]);
                addReply(pat->client,shared.pmessagebulk);
                addReplyBulk(pat->client,pat->pattern);
                addReplyBulk(pat->client,decoded);
                addReplyBulk(pat->client,message);
                receivers++;
            }
        }
        /* getDecodedObject() returns its argument unchanged, without taking
         * a reference, when it is already sds-encoded. Only release the
         * result when it is a new object, otherwise we would drop a
         * reference that belongs to the caller. */
        if (decoded != channel) decrRefCount(decoded);
    }
    return receivers;
}


================================================
FILE: src/vr_pubsub.h
================================================
#ifndef _VR_PUBSUB_H_
#define _VR_PUBSUB_H_

/* One pattern subscription: the (client, pattern) pair stored as a node of
 * the pattern list reached through c->vel->pubsub_patterns. */
typedef struct pubsubPattern {
    client *client; /* Subscriber that receives matching messages */
    robj *pattern;  /* Pattern matched against channel names on publish */
} pubsubPattern;

/* Subscription management. The single-item functions return 1 when the
 * subscription state changed and 0 otherwise; the *All* variants return the
 * number of subscriptions removed. */
int pubsubUnsubscribeChannel(client *c, robj *channel, int notify);
int pubsubUnsubscribeAllChannels(client *c, int notify);
int pubsubUnsubscribePattern(client *c, robj *pattern, int notify);
int pubsubUnsubscribeAllPatterns(client *c, int notify);
int pubsubSubscribeChannel(client *c, robj *channel);
/* Channels plus patterns the client is subscribed to. */
int clientSubscriptionsCount(client *c);
/* Command implementations. */
void subscribeCommand(client *c);
void unsubscribeCommand(client *c);
void psubscribeCommand(client *c);
void punsubscribeCommand(client *c);
int pubsubSubscribePattern(client *c, robj *pattern);
/* Deliver a message; returns the number of deliveries. */
int pubsubPublishMessage(robj *channel, robj *message);

#endif


================================================
FILE: src/vr_quicklist.c
================================================
#include <string.h> /* for memcpy */

#include <vr_core.h>

#if defined(REDIS_TEST) || defined(REDIS_TEST_VERBOSE)
#include <stdio.h> /* for printf (debug printing), snprintf (genstr) */
#endif

/* Linkage qualifier for file-private helpers: 'static' unless the build
 * already defined REDIS_STATIC to something else. */
#ifndef REDIS_STATIC
#define REDIS_STATIC static
#endif

/* Optimization levels for size-based filling.
 * NOTE(review): presumably indexed by the negative fill values accepted by
 * quicklistSetFill() (-1 .. -5); confirm against the users of this table. */
static const size_t optimization_level[] = {4096, 8192, 16384, 32768, 65536};

/* Maximum size in bytes of any multi-element ziplist.
 * Larger values will live in their own isolated ziplists. */
#define SIZE_SAFETY_LIMIT 8192

/* Minimum ziplist size in bytes for attempting compression. */
#define MIN_COMPRESS_BYTES 48

/* Minimum size reduction in bytes to store compressed quicklistNode data.
 * This also prevents us from storing compression if the compression
 * resulted in a larger size than the original data. */
#define MIN_COMPRESS_IMPROVE 8

/* If not verbose testing, remove all debug printing.
 *
 * With REDIS_TEST_VERBOSE defined, D(fmt, ...) prints the source location
 * followed by the formatted message and a newline; otherwise it expands to
 * nothing.
 *
 * NOTE(review): the verbose expansion ends in 'while (0);'. Together with
 * the caller's own ';' this yields two statements, so an unbraced
 * 'if (x) D(...); else ...' would not compile in verbose builds. */
#ifndef REDIS_TEST_VERBOSE
#define D(...)
#else
#define D(...)                                                                 \
    do {                                                                       \
        printf("%s:%s:%d:\t", __FILE__, __FUNCTION__, __LINE__);               \
        printf(__VA_ARGS__);                                                   \
        printf("\n");                                                          \
    } while (0);
#endif

/* Simple way to give quicklistEntry structs default values with one call.
 * 'e' is a pointer to the entry. Pointer members are set to NULL and 'sz'
 * to 0; 'longval' and 'offset' get the placeholder values below
 * (presumably chosen to be easy to recognize; confirm). */
#define initEntry(e)                                                           \
    do {                                                                       \
        (e)->zi = (e)->value = NULL;                                           \
        (e)->longval = -123456789;                                             \
        (e)->quicklist = NULL;                                                 \
        (e)->node = NULL;                                                      \
        (e)->offset = 123456789;                                               \
        (e)->sz = 0;                                                           \
    } while (0)

/* Branch prediction hints. With GCC 3 or newer these map to
 * __builtin_expect(); with other compilers they evaluate to the plain
 * condition. */
#if __GNUC__ >= 3
#define likely(x) __builtin_expect(!!(x), 1)
#define unlikely(x) __builtin_expect(!!(x), 0)
#else
#define likely(x) (x)
#define unlikely(x) (x)
#endif

/* Allocate an empty quicklist with default settings: no nodes, no entries,
 * compression disabled (compress == 0) and fill == -2.
 * Release it with quicklistRelease(). */
quicklist *quicklistCreate(void) {
    struct quicklist *ql = dalloc(sizeof(*ql));

    ql->head = NULL;
    ql->tail = NULL;
    ql->count = 0;
    ql->len = 0;
    ql->fill = -2;
    ql->compress = 0;
    return ql;
}

#define COMPRESS_MAX (1 << 16)
/* Store the compress depth of 'quicklist', clamping 'compress' into the
 * range [0, COMPRESS_MAX] first.
 *
 * NOTE(review): if quicklist->compress is declared as a narrow bitfield,
 * COMPRESS_MAX itself may not be representable in it -- confirm against the
 * struct definition. */
void quicklistSetCompressDepth(quicklist *quicklist, int compress) {
    if (compress < 0)
        compress = 0;
    if (compress > COMPRESS_MAX)
        compress = COMPRESS_MAX;

    quicklist->compress = compress;
}

#define FILL_MAX (1 << 15)
/* Store the fill factor of 'quicklist', clamping 'fill' into the range
 * [-5, FILL_MAX] first.
 *
 * NOTE(review): if quicklist->fill is declared as a narrow bitfield,
 * FILL_MAX itself may not be representable in it -- confirm against the
 * struct definition. */
void quicklistSetFill(quicklist *quicklist, int fill) {
    if (fill < -5)
        fill = -5;
    if (fill > FILL_MAX)
        fill = FILL_MAX;

    quicklist->fill = fill;
}

/* Apply both tunables at once: 'depth' becomes the (clamped) compress depth
 * and 'fill' the (clamped) fill factor of 'quicklist'. */
void quicklistSetOptions(quicklist *quicklist, int fill, int depth) {
    quicklistSetCompressDepth(quicklist, depth);
    quicklistSetFill(quicklist, fill);
}

/* Create a quicklist and configure its fill factor and compress depth
 * from the given (clamped) parameters. */
quicklist *quicklistNew(int fill, int compress) {
    quicklist *ql = quicklistCreate();

    quicklistSetFill(ql, fill);
    quicklistSetCompressDepth(ql, compress);
    return ql;
}

/* Allocate an unlinked, empty quicklistNode: no ziplist attached, zero
 * entries and bytes, RAW encoding, ziplist container, recompress cleared. */
REDIS_STATIC quicklistNode *quicklistCreateNode(void) {
    quicklistNode *fresh = dalloc(sizeof(*fresh));

    fresh->prev = NULL;
    fresh->next = NULL;
    fresh->zl = NULL;
    fresh->sz = 0;
    fresh->count = 0;
    fresh->container = QUICKLIST_NODE_CONTAINER_ZIPLIST;
    fresh->encoding = QUICKLIST_NODE_ENCODING_RAW;
    fresh->recompress = 0;
    return fresh;
}

/* Return the cached total number of entries stored in 'ql'. */
unsigned int quicklistCount(quicklist *ql) {
    unsigned int total = ql->count;
    return total;
}

/* Free every node of 'quicklist' (and each node's ziplist buffer), then
 * the quicklist itself. Exactly quicklist->len nodes are visited, starting
 * at the head. */
void quicklistRelease(quicklist *quicklist) {
    quicklistNode *node = quicklist->head;
    unsigned long remaining;

    for (remaining = quicklist->len; remaining > 0; remaining--) {
        quicklistNode *following = node->next;

        /* Keep the bookkeeping consistent while tearing down. */
        quicklist->count -= node->count;
        quicklist->len--;

        dfree(node->zl);
        dfree(node);

        node = following;
    }
    dfree(quicklist);
}

/* LZF-compress the ziplist held by 'node' and switch the node to LZF
 * encoding.
 *
 * Returns 1 when the node now holds compressed data.
 * Returns 0 (node untouched) when the ziplist is smaller than
 * MIN_COMPRESS_BYTES, when lzf_compress() reports failure, or when the
 * result does not save more than MIN_COMPRESS_IMPROVE bytes. */
REDIS_STATIC int __quicklistCompressNode(quicklistNode *node) {
#ifdef REDIS_TEST
    node->attempted_compress = 1;
#endif

    /* Tiny ziplists are not worth the effort. */
    if (node->sz < MIN_COMPRESS_BYTES)
        return 0;

    /* Worst case: output as large as the input. */
    quicklistLZF *packed = dalloc(sizeof(*packed) + node->sz);

    packed->sz =
        lzf_compress(node->zl, node->sz, packed->compressed, node->sz);
    if (packed->sz == 0 ||
        packed->sz + MIN_COMPRESS_IMPROVE >= node->sz) {
        /* lzf_compress gave up, or the gain is too small to keep. */
        dfree(packed);
        return 0;
    }

    /* Shrink the buffer to the actual compressed size and swap it in. */
    packed = drealloc(packed, sizeof(*packed) + packed->sz);
    dfree(node->zl);
    node->zl = (unsigned char *)packed;
    node->encoding = QUICKLIST_NODE_ENCODING_LZF;
    node->recompress = 0;
    return 1;
}

/* Compress only uncompressed nodes.
 * Safe to call with a NULL node: nothing happens. The result of
 * __quicklistCompressNode() is discarded. */
#define quicklistCompressNode(_node)                                           \
    do {                                                                       \
        if ((_node) && (_node)->encoding == QUICKLIST_NODE_ENCODING_RAW) {     \
            __quicklistCompressNode((_node));                                  \
        }                                                                      \
    } while (0)

/* Replace the LZF payload of 'node' with its decompressed ziplist and mark
 * the node as RAW encoded.
 *
 * Returns 1 on success. Returns 0 if lzf_decompress() fails, in which case
 * the node is left unchanged. */
REDIS_STATIC int __quicklistDecompressNode(quicklistNode *node) {
#ifdef REDIS_TEST
    node->attempted_compress = 0;
#endif

    quicklistLZF *packed = (quicklistLZF *)node->zl;
    void *raw = dalloc(node->sz);

    if (!lzf_decompress(packed->compressed, packed->sz, raw, node->sz)) {
        /* A decompress was requested but could not be done.  Not good. */
        dfree(raw);
        return 0;
    }

    dfree(packed);
    node->zl = raw;
    node->encoding = QUICKLIST_NODE_ENCODING_RAW;
    return 1;
}

/* Decompress only compressed nodes.
 * Safe to call with a NULL node: nothing happens. The result of
 * __quicklistDecompressNode() is discarded. */
#define quicklistDecompressNode(_node)                                         \
    do {                                                                       \
        if ((_node) && (_node)->encoding == QUICKLIST_NODE_ENCODING_LZF) {     \
            __quicklistDecompressNode((_node));                                \
        }                                                                      \
    } while (0)

/* Decompress a compressed node for temporary use and flag it with
 * recompress = 1, so that quicklistCompress() / quicklistRecompressOnly()
 * will compress this same node again afterwards.
 * Nodes that are already uncompressed (or NULL) are left untouched and
 * are not flagged. */
#define quicklistDecompressNodeForUse(_node)                                   \
    do {                                                                       \
        if ((_node) && (_node)->encoding == QUICKLIST_NODE_ENCODING_LZF) {     \
            __quicklistDecompressNode((_node));                                \
            (_node)->recompress = 1;                                           \
        }                                                                      \
    } while (0)

/* Expose the LZF payload stored in 'node'.
 * '*data' receives a pointer to the compressed bytes (still owned by the
 * node); the return value is the compressed length in bytes.
 * The node's buffer is interpreted as a quicklistLZF without checking the
 * node encoding. */
size_t quicklistGetLzf(const quicklistNode *node, void **data) {
    quicklistLZF *blob = (quicklistLZF *)node->zl;
    size_t compressed_len = blob->sz;

    *data = blob->compressed;
    return compressed_len;
}

/* True when compression is enabled for '_ql' (non-zero compress depth). */
#define quicklistAllowsCompression(_ql) ((_ql)->compress != 0)

/* Force 'quicklist' to meet compression guidelines set by compress depth.
 * The only way to guarantee interior nodes get compressed is to iterate
 * to our "interior" compress depth then compress the next node we find.
 * If compress depth is larger than the entire list, we return immediately.
 *
 * 'node' is a node that was just touched and may need compressing; it may
 * be NULL, in which case only the depth invariants are enforced.
 *
 * The first 'compress' nodes from each end are decompressed. If the two
 * ends meet or become adjacent while walking inwards, every node lies
 * within the protected depth of one of the ends and nothing is compressed. */
REDIS_STATIC void __quicklistCompress(const quicklist *quicklist,
                                      quicklistNode *node) {
    /* If length is less than our compress depth (from both sides),
     * we can't compress anything. */
    if (!quicklistAllowsCompression(quicklist) ||
        quicklist->len < (unsigned int)(quicklist->compress * 2))
        return;

    /* Iterate until we reach compress depth for both sides of the list.
     * Note: because we do length checks at the *top* of this function,
     *       we can skip explicit null checks below. Everything exists. */
    quicklistNode *forward = quicklist->head;
    quicklistNode *reverse = quicklist->tail;
    int depth = 0;
    int in_depth = 0;
    while (depth++ < quicklist->compress) {
        quicklistDecompressNode(forward);
        quicklistDecompressNode(reverse);

        if (forward == node || reverse == node)
            in_depth = 1;

        /* The cursors met (odd number of nodes) or are adjacent (even
         * number of nodes): advancing further would step into the
         * protected depth of the opposite end, so there is nothing left
         * to compress. Without the adjacency check a list with exactly
         * 2 * compress nodes would get its two middle nodes compressed
         * even though both are within the uncompressed depth. */
        if (forward == reverse || forward->next == reverse)
            return;

        forward = forward->next;
        reverse = reverse->prev;
    }

    if (!in_depth)
        quicklistCompressNode(node);

    if (depth > 2) {
        /* At this point, forward and reverse are one node beyond depth */
        quicklistCompressNode(forward);
        quicklistCompressNode(reverse);
    }
}

/* Re-establish compression after '_node' was used.
 * If the node is flagged 'recompress' (set by
 * quicklistDecompressNodeForUse()), just compress that node again;
 * otherwise run the full depth-based pass in __quicklistCompress().
 * '_node' must not be NULL (it is dereferenced unconditionally). */
#define quicklistCompress(_ql, _node)                                          \
    do {                                                                       \
        if ((_node)->recompress)                                               \
            quicklistCompressNode((_node));                                    \
        else                                                                   \
            __quicklistCompress((_ql), (_node));                               \
    } while (0)

/* If we previously used quicklistDecompressNodeForUse(), just recompress.
 * Nodes not flagged 'recompress' are left as they are; '_ql' is unused. */
#define quicklistRecompressOnly(_ql, _node)                                    \
    do {                                                                       \
        if ((_node)->recompress)                                               \
            quicklistCompressNode((_node));                                    \
    } while (0)

/* Link 'new_node' into 'quicklist' next to 'old_node'.
 *
 * after != 0: 'new_node' is placed right after 'old_node'.
 * after == 0: 'new_node' is placed right before 'old_node'.
 *
 * 'old_node' may be NULL (e.g. when the list is empty); head and tail are
 * then set from the empty-list check below. The list length is incremented,
 * and 'old_node' (if any) is handed to quicklistCompress().
 *
 * Note: 'new_node' is *always* uncompressed, so if we assign it to
 *       head or tail, we do not need to uncompress it. */
REDIS_STATIC void __quicklistInsertNode(quicklist *quicklist,
                                        quicklistNode *old_node,
                                        quicklistNode *new_node, int after) {
    if (!after) {
        /* Splice in front of old_node. */
        new_node->next = old_node;
        if (old_node) {
            quicklistNode *before = old_node->prev;

            new_node->prev = before;
            if (before)
                before->next = new_node;
            old_node->prev = new_node;
        }
        if (quicklist->head == old_node)
            quicklist->head = new_node;
    } else {
        /* Splice behind old_node. */
        new_node->prev = old_node;
        if (old_node) {
            quicklistNode *following = old_node->next;

            new_node->next = following;
            if (following)
                following->prev = new_node;
            old_node->next = new_node;
        }
        if (quicklist->tail == old_node)
            quicklist->tail = new_node;
    }

    /* First node ever: it is both head and tail. */
    if (quicklist->len == 0) {
        quicklist->head = new_node;
        quicklist->tail = new_node;
    }

    /* Note: runs while quicklist->len still holds the pre-insert value. */
    if (old_node) {
        quicklistCompress(quicklist, old_node);
    }

    quicklist->len++;
}

/* Wrappers for node inserting around existing node. */

/* Link 'new_node' immediately before 'old_node'. */
REDIS_STATIC void _quicklistInsertNodeBefore(quicklist *quicklist,
                                             quicklistNode *old_node,
                                             quicklistNode *new_node) {
    const int after = 0;

    __quicklistInsertNode(quicklist, old_node, new_node, after);
}

/* Link 'new_node' immediately after 'old_node'. */
REDIS_STATIC void _quicklistInsertNodeAfter(quicklist *quicklist,
                                            quicklistNode *old_node,
                                            quicklistNode *new_node) {
    const int after = 1;

    __quicklistInsertNode(quicklist, old_node, new_node, after);
}

/* Size-based fill check.
 *
 * A negative 'fill' selects entry (-fill - 1) of optimization_level[].
 * Returns 1 when 'sz' does not exceed that entry.
 * Returns 0 when 'fill' is non-negative (count-based fill), when it selects
 * an entry beyond the table, or when 'sz' is too large. */
REDIS_STATIC int
_quicklistNodeSizeMeetsOptimizationRequirement(const size_t sz,
                                               const int fill) {
    const size_t levels =
        sizeof(optimization_level) / sizeof(*optimization_level);

    if (fill >= 0)
        return 0;

    size_t level = (-fill) - 1;
    if (level >= levels)
        return 0;

    return sz <= optimization_level[level];
}

/* True when 'sz' (bytes) does not exceed SIZE_SAFETY_LIMIT. */
#define sizeMeetsSafetyLimit(sz) ((sz) <= SIZE_SAFETY_LIMIT)

/* Decide whether an element of 'sz' bytes may be added to 'node'.
 *
 * node: candidate node; NULL is allowed and always yields 0.
 * fill: the quicklist fill factor (negative = size-based limit,
 *       non-negative = maximum entry count per node).
 * sz:   length in bytes of the value to insert.
 *
 * Returns 1 if the insert is allowed, 0 if the node is (or would become)
 * full.
 *
 * The estimated new size is kept in a size_t: storing it in an unsigned
 * int would truncate very large 'sz' values and could let an oversized
 * element pass the size checks. */
REDIS_STATIC int _quicklistNodeAllowInsert(const quicklistNode *node,
                                           const int fill, const size_t sz) {
    if (unlikely(!node))
        return 0;

    int ziplist_overhead;
    /* size of previous offset */
    if (sz < 254)
        ziplist_overhead = 1;
    else
        ziplist_overhead = 5;

    /* size of forward offset */
    if (sz < 64)
        ziplist_overhead += 1;
    else if (likely(sz < 16384))
        ziplist_overhead += 2;
    else
        ziplist_overhead += 5;

    /* new_sz overestimates if 'sz' encodes to an integer type */
    size_t new_sz = (size_t)node->sz + sz + (size_t)ziplist_overhead;
    if (likely(_quicklistNodeSizeMeetsOptimizationRequirement(new_sz, fill)))
        return 1;
    else if (!sizeMeetsSafetyLimit(new_sz))
        return 0;
    else if ((int)node->count < fill)
        return 1;
    else
        return 0;
}

/* Decide whether nodes 'a' and 'b' may be merged under fill factor 'fill'.
 * Either node may be NULL, which yields 0.
 *
 * Returns 1 if the merged node would satisfy the size-based limit, or, for
 * count-based fill, stays within the safety limit and holds at most 'fill'
 * entries. Returns 0 otherwise. */
REDIS_STATIC int _quicklistNodeAllowMerge(const quicklistNode *a,
                                          const quicklistNode *b,
                                          const int fill) {
    if (a == NULL || b == NULL)
        return 0;

    /* approximate merged ziplist size (- 11 to remove one ziplist
     * header/trailer) */
    unsigned int merge_sz = a->sz + b->sz - 11;

    if (likely(_quicklistNodeSizeMeetsOptimizationRequirement(merge_sz, fill)))
        return 1;

    if (!sizeMeetsSafetyLimit(merge_sz))
        return 0;

    return (int)(a->count + b->count) <= fill;
}

/* Refresh the cached byte size of 'node' from its ziplist.
 * Functions in this file call it after modifying node->zl; the node's zl
 * is passed straight to ziplistBlobLen(). */
#define quicklistNodeUpdateSz(node)                                            \
    do {                                                                       \
        (node)->sz = ziplistBlobLen((node)->zl);                               \
    } while (0)

/* Prepend 'value' ('sz' bytes) to the quicklist.
 *
 * The value goes into the current head node when that node accepts it;
 * otherwise a new node holding only this value becomes the head.
 *
 * Returns 0 if used existing head.
 * Returns 1 if new head created. */
int quicklistPushHead(quicklist *quicklist, void *value, size_t sz) {
    quicklistNode *const head_before = quicklist->head;

    if (likely(_quicklistNodeAllowInsert(head_before, quicklist->fill, sz))) {
        head_before->zl =
            ziplistPush(head_before->zl, value, sz, ZIPLIST_HEAD);
        quicklistNodeUpdateSz(head_before);
    } else {
        quicklistNode *fresh = quicklistCreateNode();

        fresh->zl = ziplistPush(ziplistNew(), value, sz, ZIPLIST_HEAD);
        quicklistNodeUpdateSz(fresh);
        _quicklistInsertNodeBefore(quicklist, head_before, fresh);
    }

    /* Whichever node is head now received the entry. */
    quicklist->head->count++;
    quicklist->count++;
    return quicklist->head != head_before;
}

/* Append 'value' ('sz' bytes) to the quicklist.
 *
 * The value goes into the current tail node when that node accepts it;
 * otherwise a new node holding only this value becomes the tail.
 *
 * Returns 0 if used existing tail.
 * Returns 1 if new tail created. */
int quicklistPushTail(quicklist *quicklist, void *value, size_t sz) {
    quicklistNode *const tail_before = quicklist->tail;

    if (likely(_quicklistNodeAllowInsert(tail_before, quicklist->fill, sz))) {
        tail_before->zl =
            ziplistPush(tail_before->zl, value, sz, ZIPLIST_TAIL);
        quicklistNodeUpdateSz(tail_before);
    } else {
        quicklistNode *fresh = quicklistCreateNode();

        fresh->zl = ziplistPush(ziplistNew(), value, sz, ZIPLIST_TAIL);
        quicklistNodeUpdateSz(fresh);
        _quicklistInsertNodeAfter(quicklist, tail_before, fresh);
    }

    /* Whichever node is tail now received the entry. */
    quicklist->tail->count++;
    quicklist->count++;
    return quicklist->tail != tail_before;
}

/* Wrap the pre-formed ziplist 'zl' in a new node and append that node at
 * the tail of 'quicklist'. The node stores 'zl' directly (no copy is
 * made); its entry count and byte size are read from the ziplist.
 * Used for loading RDBs where entire ziplists have been stored
 * to be retrieved later. */
void quicklistAppendZiplist(quicklist *quicklist, unsigned char *zl) {
    quicklistNode *wrapper = quicklistCreateNode();

    wrapper->zl = zl;
    wrapper->count = ziplistLen(wrapper->zl);
    quicklistNodeUpdateSz(wrapper);

    _quicklistInsertNodeAfter(quicklist, quicklist->tail, wrapper);
    quicklist->count += wrapper->count;
}

/* Push every entry of ziplist 'zl', one by one, onto the tail of
 * 'quicklist'.
 *
 * This allows us to restore old RDB ziplists into new quicklists
 * with smaller ziplist sizes than the saved RDB ziplist.
 * Entries that ziplistGet() reports as integers (no string pointer) are
 * converted to their decimal string form before being pushed.
 *
 * Returns 'quicklist' argument. Frees passed-in ziplist 'zl' */
quicklist *quicklistAppendValuesFromZiplist(quicklist *quicklist,
                                            unsigned char *zl) {
    char numbuf[32] = {0};
    unsigned char *str;
    unsigned int len;
    long long num;

    for (unsigned char *cursor = ziplistIndex(zl, 0);
         ziplistGet(cursor, &str, &len, &num);
         cursor = ziplistNext(zl, cursor)) {
        if (str == NULL) {
            /* Integer entry: render it as text so it can be re-added. */
            len = ll2string(numbuf, sizeof(numbuf), num);
            str = (unsigned char *)numbuf;
        }
        quicklistPushTail(quicklist, str, len);
    }

    dfree(zl);
    return quicklist;
}

/* Build a new (potentially multi-node) quicklist, configured with 'fill'
 * and 'compress', from the entries of a single existing ziplist.
 *
 * Returns new quicklist.  Frees passed-in ziplist 'zl'. */
quicklist *quicklistCreateFromZiplist(int fill, int compress,
                                      unsigned char *zl) {
    quicklist *target = quicklistNew(fill, compress);

    return quicklistAppendValuesFromZiplist(target, zl);
}

/* If node 'n' holds no entries, unlink and free it via
 * __quicklistDelNode() and set the caller's variable 'n' to NULL.
 * 'n' must therefore be an assignable lvalue. */
#define quicklistDeleteIfEmpty(ql, n)                                          \
    do {                                                                       \
        if ((n)->count == 0) {                                                 \
            __quicklistDelNode((ql), (n));                                     \
            (n) = NULL;                                                        \
        }                                                                      \
    } while (0)

/* Unlink 'node' from 'quicklist' and free it together with its ziplist.
 *
 * Neighbour links and the list head/tail are fixed up first, then the
 * compression invariants are re-applied, and finally the entry count and
 * node count of the quicklist are reduced. */
REDIS_STATIC void __quicklistDelNode(quicklist *quicklist,
                                     quicklistNode *node) {
    /* Bypass 'node' in the doubly linked list. */
    if (node->next)
        node->next->prev = node->prev;
    if (node->prev)
        node->prev->next = node->next;

    if (node == quicklist->tail) {
        quicklist->tail = node->prev;
    }

    if (node == quicklist->head) {
        quicklist->head = node->next;
    }

    /* If we deleted a node within our compress depth, we
     * now have compressed nodes needing to be decompressed.
     * Note: at this point quicklist->len has not been decremented yet, so
     * __quicklistCompress() sees the pre-deletion node count. */
    __quicklistCompress(quicklist, NULL);

    quicklist->count -= node->count;

    dfree(node->zl);
    dfree(node);
    quicklist->len--;
}

/* Remove the ziplist entry '*p' from 'node'.
 *
 * Note: quicklistDelIndex() *requires* uncompressed nodes because you
 *       already had to get *p from an uncompressed node somewhere.
 *
 * If the node becomes empty it is unlinked and freed, and must not be used
 * by the caller afterwards.
 *
 * Returns 1 if the entire node was deleted, 0 if node still exists.
 * Also updates in/out param 'p' with the next offset in the ziplist. */
REDIS_STATIC int quicklistDelIndex(quicklist *quicklist, quicklistNode *node,
                                   unsigned char **p) {
    node->zl = ziplistDelete(node->zl, p);
    node->count--;

    const int node_removed = (node->count == 0);
    if (node_removed) {
        __quicklistDelNode(quicklist, node);
    } else {
        quicklistNodeUpdateSz(node);
    }

    quicklist->count--;
    return node_removed;
}

/* Delete the element described by 'entry' and keep 'iter' usable.
 *
 * 'entry' stores enough metadata to delete the proper position in
 * the correct ziplist in the correct quicklist node. */
void quicklistDelEntry(quicklistIter *iter, quicklistEntry *entry) {
    /* Remember the neighbours first: the node may be freed below. */
    quicklistNode *following = entry->node->next;
    quicklistNode *preceding = entry->node->prev;

    int node_removed = quicklistDelIndex((quicklist *)entry->quicklist,
                                         entry->node, &entry->zi);

    /* The cached ziplist position is stale after any delete. */
    iter->zi = NULL;

    /* If the node survived, no further changes are needed: iter->zi was
     * reset above, and the existing iter->offset doesn't move because:
     *   - [1, 2, 3] => delete offset 1 => [1, 3]: next element still offset 1
     *   - [1, 2, 3] => delete offset 0 => [2, 3]: next element still offset 0
     *  if we deleted the last element at offset N and now
     *  length of this ziplist is N-1, the next call into
     *  quicklistNext() will jump to the next node. */
    if (!node_removed)
        return;

    /* The current node is gone: move the iterator to the neighbouring
     * node in its travel direction. */
    if (iter->direction == AL_START_HEAD) {
        iter->current = following;
        iter->offset = 0;
    } else if (iter->direction == AL_START_TAIL) {
        iter->current = preceding;
        iter->offset = -1;
    }
}

/* Replace quicklist entry at offset 'index' by 'data' with length 'sz'.
 *
 * The old entry is deleted from its ziplist and the new value inserted at
 * the same position. The node's cached byte size is refreshed afterwards:
 * the replacement value may have a different length, and other functions in
 * this file rely on node->sz matching the ziplist (for example
 * _quicklistSplitNode() copies node->sz bytes).
 *
 * Returns 1 if replace happened.
 * Returns 0 if replace failed and no changes happened. */
int quicklistReplaceAtIndex(quicklist *quicklist, long index, void *data,
                            int sz) {
    quicklistEntry entry;
    if (likely(quicklistIndex(quicklist, index, &entry))) {
        /* quicklistIndex provides an uncompressed node */
        entry.node->zl = ziplistDelete(entry.node->zl, &entry.zi);
        entry.node->zl = ziplistInsert(entry.node->zl, entry.zi, data, sz);
        /* Keep the cached size in sync before any compression decision. */
        quicklistNodeUpdateSz(entry.node);
        quicklistCompress(quicklist, entry.node);
        return 1;
    } else {
        return 0;
    }
}

/* Try to merge the ziplists of two nodes into one node.
 *
 * This helps us not have a quicklist with 3 element ziplists if
 * our fill factor can handle much higher levels.
 *
 * Note: 'a' must be to the LEFT of 'b'.
 *
 * Both nodes are decompressed first. On success, the node whose ziplist
 * pointer was cleared by ziplistMerge() is removed from the quicklist, and
 * the surviving node gets its count and size refreshed.
 *
 * After calling this function, both 'a' and 'b' should be considered
 * unusable.  The return value from this function must be used
 * instead of re-using any of the quicklistNode input arguments.
 *
 * Returns the input node picked to merge against or NULL if
 * merging was not possible. */
REDIS_STATIC quicklistNode *_quicklistZiplistMerge(quicklist *quicklist,
                                                   quicklistNode *a,
                                                   quicklistNode *b) {
    D("Requested merge (a,b) (%u, %u)", a->count, b->count);

    quicklistDecompressNode(a);
    quicklistDecompressNode(b);

    if (!ziplistMerge(&a->zl, &b->zl)) {
        /* The merge returned NULL and nothing changed. */
        return NULL;
    }

    /* We merged ziplists! Work out which node still owns data. */
    quicklistNode *survivor = NULL;
    quicklistNode *emptied = NULL;
    if (!a->zl) {
        emptied = a;
        survivor = b;
    } else if (!b->zl) {
        emptied = b;
        survivor = a;
    }

    survivor->count = ziplistLen(survivor->zl);
    quicklistNodeUpdateSz(survivor);

    /* Now remove the unused quicklistNode. */
    emptied->count = 0;
    __quicklistDelNode(quicklist, emptied);
    quicklistCompress(quicklist, survivor);
    return survivor;
}

/* Attempt to merge ziplists within two nodes on either side of 'center'.
 *
 * We attempt to merge:
 *   - (center->prev->prev, center->prev)
 *   - (center->next, center->next->next)
 *   - (center->prev, center)
 *   - (center, center->next)
 *
 * Each merge is only attempted when _quicklistNodeAllowMerge() approves it
 * for the quicklist's fill factor. Merging can free nodes, so local
 * pointers are invalidated after each step and neighbours are re-read from
 * 'center' / 'target'. */
REDIS_STATIC void _quicklistMergeNodes(quicklist *quicklist,
                                       quicklistNode *center) {
    int fill = quicklist->fill;
    quicklistNode *prev, *prev_prev, *next, *next_next, *target;
    prev = prev_prev = next = next_next = target = NULL;

    /* Snapshot up to two neighbours on the left... */
    if (center->prev) {
        prev = center->prev;
        if (center->prev->prev)
            prev_prev = center->prev->prev;
    }

    /* ...and up to two neighbours on the right. */
    if (center->next) {
        next = center->next;
        if (center->next->next)
            next_next = center->next->next;
    }

    /* Try to merge prev_prev and prev */
    if (_quicklistNodeAllowMerge(prev, prev_prev, fill)) {
        _quicklistZiplistMerge(quicklist, prev_prev, prev);
        prev_prev = prev = NULL; /* they could have moved, invalidate them. */
    }

    /* Try to merge next and next_next */
    if (_quicklistNodeAllowMerge(next, next_next, fill)) {
        _quicklistZiplistMerge(quicklist, next, next_next);
        next = next_next = NULL; /* they could have moved, invalidate them. */
    }

    /* Try to merge center node and previous node */
    if (_quicklistNodeAllowMerge(center, center->prev, fill)) {
        target = _quicklistZiplistMerge(quicklist, center->prev, center);
        center = NULL; /* center could have been deleted, invalidate it. */
    } else {
        /* else, we didn't merge here, but target needs to be valid below. */
        target = center;
    }

    /* Use result of center merge (or original) to merge with next node.
     * NOTE(review): _quicklistZiplistMerge() is documented to return NULL
     * when merging is not possible; 'target' is dereferenced here without
     * a NULL check -- confirm that cannot happen after an approved merge. */
    if (_quicklistNodeAllowMerge(target, target->next, fill)) {
        _quicklistZiplistMerge(quicklist, target, target->next);
    }
}

/* Split 'node' into two parts, parameterized by 'offset' and 'after'.
 *
 * A new node is created holding a byte copy of the ziplist of 'node';
 * complementary ranges are then deleted from the two ziplists
 * (a delete count of -1 means "continue deleting until the list ends"):
 *
 * If 'after'==1:
 *   input node:    delete from index OFFSET+1 to the end.
 *   returned node: delete OFFSET+1 entries starting at index 0.
 *
 * If 'after'==0:
 *   input node:    delete OFFSET entries starting at index 0.
 *   returned node: delete from index OFFSET to the end.
 *
 * (Assuming ziplistDeleteRange(zl, start, n) removes n entries beginning
 * at 'start': for after==1 the input keeps [0, OFFSET] and the returned
 * node gets [OFFSET+1, END]; for after==0 the returned node gets the
 * entries before OFFSET and the input keeps [OFFSET, END].)
 *
 * 'node' must be uncompressed. Counts and sizes of both nodes are
 * refreshed. The returned node is not linked into any quicklist.
 *
 * Returns the newly created node. */
REDIS_STATIC quicklistNode *_quicklistSplitNode(quicklistNode *node, int offset,
                                                int after) {
    const size_t zl_sz = node->sz;

    /* Duplicate the original ziplist so each half can be trimmed. */
    quicklistNode *new_node = quicklistCreateNode();
    new_node->zl = dalloc(zl_sz);
    memcpy(new_node->zl, node->zl, zl_sz);

    int orig_start, orig_extent;
    int new_start, new_extent;
    if (after) {
        orig_start = offset + 1;
        orig_extent = -1;
        new_start = 0;
        new_extent = offset + 1;
    } else {
        orig_start = 0;
        orig_extent = offset;
        new_start = offset;
        new_extent = -1;
    }

    D("After %d (%d); ranges: [%d, %d], [%d, %d]", after, offset, orig_start,
      orig_extent, new_start, new_extent);

    /* Trim the original node... */
    node->zl = ziplistDeleteRange(node->zl, orig_start, orig_extent);
    node->count = ziplistLen(node->zl);
    quicklistNodeUpdateSz(node);

    /* ...and remove the complementary range from the copy. */
    new_node->zl = ziplistDeleteRange(new_node->zl, new_start, new_extent);
    new_node->count = ziplistLen(new_node->zl);
    quicklistNodeUpdateSz(new_node);

    D("After split lengths: orig (%d), new (%d)", node->count, new_node->count);
    return new_node;
}

/* Insert a new entry before or after existing entry 'entry'.
 *
 * If after==1, the new value is inserted after 'entry', otherwise
 * the new value is inserted before 'entry'.
 *
 * quicklist: list being modified; its entry count is incremented.
 * entry:     reference position (node, ziplist pointer and offset). If
 *            entry->node is NULL, a single new node holding only 'value'
 *            is created and linked into the list.
 * value, sz: bytes to insert and their length.
 *
 * Strategy, in order:
 *   1. the reference node has room: insert directly into it;
 *   2. the node is full, we are at its edge and the neighbour on that
 *      side has room: insert at the facing end of that neighbour;
 *   3. the node and that neighbour are both full: create a new node
 *      between them;
 *   4. otherwise: split the reference node at the entry, add the value to
 *      the new half, link it in and try to merge neighbouring nodes. */
REDIS_STATIC void _quicklistInsert(quicklist *quicklist, quicklistEntry *entry,
                                   void *value, const size_t sz, int after) {
    int full = 0, at_tail = 0, at_head = 0, full_next = 0, full_prev = 0;
    int fill = quicklist->fill;
    quicklistNode *node = entry->node;
    quicklistNode *new_node = NULL;

    if (!node) {
        /* we have no reference node, so let's create only node in the list */
        D("No node given!");
        new_node = quicklistCreateNode();
        new_node->zl = ziplistPush(ziplistNew(), value, sz, ZIPLIST_HEAD);
        /* Record the ziplist size like every other node-creation path;
         * otherwise node->sz stays 0 while the ziplist holds data. */
        quicklistNodeUpdateSz(new_node);
        __quicklistInsertNode(quicklist, NULL, new_node, after);
        new_node->count++;
        quicklist->count++;
        return;
    }

    /* Populate accounting flags for easier boolean checks later */
    if (!_quicklistNodeAllowInsert(node, fill, sz)) {
        D("Current node is full with count %d with requested fill %d",
          node->count, fill);
        full = 1;
    }

    if (after && (entry->offset == node->count)) {
        D("At Tail of current ziplist");
        at_tail = 1;
        if (!_quicklistNodeAllowInsert(node->next, fill, sz)) {
            D("Next node is full too.");
            full_next = 1;
        }
    }

    if (!after && (entry->offset == 0)) {
        D("At Head");
        at_head = 1;
        if (!_quicklistNodeAllowInsert(node->prev, fill, sz)) {
            D("Prev node is full too.");
            full_prev = 1;
        }
    }

    /* Now determine where and how to insert the new element */
    if (!full && after) {
        D("Not full, inserting after current position.");
        quicklistDecompressNodeForUse(node);
        unsigned char *next = ziplistNext(node->zl, entry->zi);
        if (next == NULL) {
            node->zl = ziplistPush(node->zl, value, sz, ZIPLIST_TAIL);
        } else {
            node->zl = ziplistInsert(node->zl, next, value, sz);
        }
        node->count++;
        quicklistNodeUpdateSz(node);
        quicklistRecompressOnly(quicklist, node);
    } else if (!full && !after) {
        D("Not full, inserting before current position.");
        quicklistDecompressNodeForUse(node);
        node->zl = ziplistInsert(node->zl, entry->zi, value, sz);
        node->count++;
        quicklistNodeUpdateSz(node);
        quicklistRecompressOnly(quicklist, node);
    } else if (full && at_tail && node->next && !full_next && after) {
        /* If we are: at tail, next has free space, and inserting after:
         *   - insert entry at head of next node. */
        D("Full and tail, but next isn't full; inserting next node head");
        new_node = node->next;
        quicklistDecompressNodeForUse(new_node);
        new_node->zl = ziplistPush(new_node->zl, value, sz, ZIPLIST_HEAD);
        new_node->count++;
        quicklistNodeUpdateSz(new_node);
        quicklistRecompressOnly(quicklist, new_node);
    } else if (full && at_head && node->prev && !full_prev && !after) {
        /* If we are: at head, previous has free space, and inserting before:
         *   - insert entry at tail of previous node. */
        D("Full and head, but prev isn't full, inserting prev node tail");
        new_node = node->prev;
        quicklistDecompressNodeForUse(new_node);
        new_node->zl = ziplistPush(new_node->zl, value, sz, ZIPLIST_TAIL);
        new_node->count++;
        quicklistNodeUpdateSz(new_node);
        quicklistRecompressOnly(quicklist, new_node);
    } else if (full && ((at_tail && node->next && full_next && after) ||
                        (at_head && node->prev && full_prev && !after))) {
        /* If we are: full, and our prev/next is full, then:
         *   - create new node and attach to quicklist */
        D("\tprovisioning new node...");
        new_node = quicklistCreateNode();
        new_node->zl = ziplistPush(ziplistNew(), value, sz, ZIPLIST_HEAD);
        new_node->count++;
        quicklistNodeUpdateSz(new_node);
        __quicklistInsertNode(quicklist, node, new_node, after);
    } else if (full) {
        /* else, node is full we need to split it. */
        /* covers both after and !after cases */
        D("\tsplitting node...");
        quicklistDecompressNodeForUse(node);
        new_node = _quicklistSplitNode(node, entry->offset, after);
        new_node->zl = ziplistPush(new_node->zl, value, sz,
                                   after ? ZIPLIST_HEAD : ZIPLIST_TAIL);
        new_node->count++;
        quicklistNodeUpdateSz(new_node);
        __quicklistInsertNode(quicklist, node, new_node, after);
        _quicklistMergeNodes(quicklist, node);
    }

    quicklist->count++;
}

/* Insert 'value' ('sz' bytes) immediately before the element described by
 * 'entry'. */
void quicklistInsertBefore(quicklist *quicklist, quicklistEntry *entry,
                           void *value, const size_t sz) {
    const int after = 0;

    _quicklistInsert(quicklist, entry, value, sz, after);
}

/* Insert 'value' ('sz' bytes) immediately after the element described by
 * 'entry'. */
void quicklistInsertAfter(quicklist *quicklist, quicklistEntry *entry,
                          void *value, const size_t sz) {
    const int after = 1;

    _quicklistInsert(quicklist, entry, value, sz, after);
}

/* Delete a range of elements from the quicklist.
 *
 * 'start' is the index of the first element to delete; negative values
 * count from the tail exactly as in quicklistIndex().
 * 'count' is the maximum number of elements to delete (NOT an end index).
 * The request is clamped so it never runs past the end of the list.
 *
 * elements may span across multiple quicklistNodes, so we
 * have to be careful about tracking where we start and end.
 *
 * Returns 1 if entries were deleted, 0 if nothing was deleted. */
int quicklistDelRange(quicklist *quicklist, const long start,
                      const long count) {
    if (count <= 0)
        return 0;

    unsigned long extent = count; /* range is inclusive of start position */

    if (start >= 0 && extent > (quicklist->count - start)) {
        /* if requesting delete more elements than exist, limit to list size. */
        extent = quicklist->count - start;
    } else if (start < 0 && extent > (unsigned long)(-start)) {
        /* else, if at negative offset, limit max size to rest of list. */
        extent = -start; /* c.f. LREM -29 29; just delete until end. */
    }

    quicklistEntry entry;
    if (!quicklistIndex(quicklist, start, &entry))
        return 0;

    D("Quicklist delete request for start %ld, count %ld, extent: %ld", start,
      count, extent);
    quicklistNode *node = entry.node;

    /* iterate over next nodes until everything is deleted.
     * The 'node' check is purely defensive: after clamping, 'extent' should
     * never exceed the entries that remain, but we must not dereference a
     * NULL node if the bookkeeping is ever off. */
    while (extent && node) {
        /* Remember the successor now: 'node' may be freed below. */
        quicklistNode *next = node->next;

        unsigned long del;
        int delete_entire_node = 0;
        if (entry.offset == 0 && extent >= node->count) {
            /* If we are deleting more than the count of this node, we
             * can just delete the entire node without ziplist math. */
            delete_entire_node = 1;
            del = node->count;
        } else if (entry.offset >= 0 &&
                   extent + entry.offset >= node->count) {
            /* The range reaches (or passes) the end of this node, so delete
             * everything from 'offset' to the node's last entry.
             * The offset has to be part of the comparison: testing only
             * 'extent >= node->count' would let e.g. offset 5, count 10,
             * extent 7 fall through to 'del = extent' and subtract more
             * entries from the counters than this node holds past 'offset'. */
            del = node->count - entry.offset;
        } else if (entry.offset < 0) {
            /* If offset is negative, we are in the first run of this loop
             * and we are deleting the entire range
             * from this start offset to end of list.  Since the Negative
             * offset is the number of elements until the tail of the list,
             * just use it directly as the deletion count. */
            del = -entry.offset;

            /* If the positive offset is greater than the remaining extent,
             * we only delete the remaining extent, not the entire offset.
             */
            if (del > extent)
                del = extent;
        } else {
            /* else, we are deleting less than the extent of this node, so
             * use extent directly. */
            del = extent;
        }

        D("[%ld]: asking to del: %ld because offset: %d; (ENTIRE NODE: %d), "
          "node count: %u",
          extent, del, entry.offset, delete_entire_node, node->count);

        if (delete_entire_node) {
            __quicklistDelNode(quicklist, node);
        } else {
            quicklistDecompressNodeForUse(node);
            node->zl = ziplistDeleteRange(node->zl, entry.offset, del);
            quicklistNodeUpdateSz(node);
            node->count -= del;
            quicklist->count -= del;
            quicklistDeleteIfEmpty(quicklist, node);
            /* NOTE(review): this check only makes sense if
             * quicklistDeleteIfEmpty() resets 'node' to NULL when it removes
             * the node -- confirm against its definition. */
            if (node)
                quicklistRecompressOnly(quicklist, node);
        }

        extent -= del;

        node = next;

        /* Every node after the first is processed from its first entry. */
        entry.offset = 0;
    }
    return 1;
}

/* Passthrough to ziplistCompare(): forwards all three arguments unchanged
 * and hands its result back to the caller. */
int quicklistCompare(unsigned char *p1, unsigned char *p2, int p2_len) {
    int result = ziplistCompare(p1, p2, p2_len);

    return result;
}

/* Returns a quicklist iterator 'iter'. After the initialization every
 * call to quicklistNext() will return the next element of the quicklist.
 *
 * 'direction' selects the starting end:
 *   AL_START_HEAD - start at the head node, offset 0;
 *   AL_START_TAIL - start at the tail node, offset -1 (last entry).
 * Any other value yields an iterator with no current node, so the first
 * quicklistNext() call reports the end of iteration instead of reading
 * uninitialized fields.
 *
 * The iterator is allocated with dalloc(); release it with
 * quicklistReleaseIterator(). */
quicklistIter *quicklistGetIterator(const quicklist *quicklist, int direction) {
    quicklistIter *iter;

    iter = dalloc(sizeof(*iter));

    /* Defined defaults for every field, whatever 'direction' is. */
    iter->current = NULL;
    iter->offset = 0;

    if (direction == AL_START_HEAD) {
        iter->current = quicklist->head;
    } else if (direction == AL_START_TAIL) {
        iter->current = quicklist->tail;
        iter->offset = -1;
    }

    iter->direction = direction;
    iter->quicklist = quicklist;

    /* No ziplist position yet; quicklistNext() resolves it from 'offset'. */
    iter->zi = NULL;

    return iter;
}

/* Build an iterator positioned on the element at index 'idx' that will walk
 * the list in 'direction'.
 *
 * Returns NULL when quicklistIndex() cannot resolve 'idx'. */
quicklistIter *quicklistGetIteratorAtIdx(const quicklist *quicklist,
                                         const int direction,
                                         const long long idx) {
    quicklistEntry found;
    quicklistIter *iter;

    /* Nothing to iterate from if the index does not resolve. */
    if (!quicklistIndex(quicklist, idx, &found))
        return NULL;

    /* Start from a regular iterator, then move it onto the located entry. */
    iter = quicklistGetIterator(quicklist, direction);
    iter->zi = NULL;
    iter->current = found.node;
    iter->offset = found.offset;

    return iter;
}

/* Dispose of an iterator.
 * When the iterator still points at a node, that node is handed to
 * quicklistCompress() first; the iterator itself is then freed. */
void quicklistReleaseIterator(quicklistIter *iter) {
    quicklistNode *last = iter->current;

    if (last != NULL)
        quicklistCompress(iter->quicklist, last);

    dfree(iter);
}

/* Get next element in iterator.
 *
 * Note: You must NOT insert into the list while iterating over it.
 * You *may* delete from the list while iterating using the
 * quicklistDelEntry() function.
 * If you insert into the quicklist while iterating, you should
 * re-create the iterator after your addition.
 *
 * iter = quicklistGetIterator(quicklist,<direction>);
 * quicklistEntry entry;
 * while (quicklistNext(iter, &entry)) {
 *     if (entry.value)
 *          [[ use entry.value with entry.sz ]]
 *     else
 *          [[ use entry.longval ]]
 * }
 *
 * Populates 'entry' with values for this iteration.
 * Returns 1 when 'entry' was populated.
 * Returns 0 when iteration is complete or if iteration not possible
 * ('iter' is NULL or it has no current node).
 * If return value is 0, the contents of 'entry' are not valid.
 */
int quicklistNext(quicklistIter *iter, quicklistEntry *entry) {
    /* 'entry' is reset first, even when 'iter' turns out to be NULL. */
    initEntry(entry);

    if (!iter) {
        D("Returning because no iter!");
        return 0;
    }

    entry->quicklist = iter->quicklist;
    entry->node = iter->current;

    if (!iter->current) {
        /* NOTE(review): no ';' after D(...) on the next line; this relies on
         * how the D() macro expands -- confirm. */
        D("Returning because current node is NULL")
        return 0;
    }

    /* Step function and offset delta, chosen from the iterator direction. */
    unsigned char *(*nextFn)(unsigned char *, unsigned char *) = NULL;
    int offset_update = 0;

    if (!iter->zi) {
        /* If !zi, use current index: this is the first visit to this node,
         * so resolve 'offset' into a ziplist position. */
        quicklistDecompressNodeForUse(iter->current);
        iter->zi = ziplistIndex(iter->current->zl, iter->offset);
    } else {
        /* else, use existing iterator offset and get prev/next as necessary. */
        if (iter->direction == AL_START_HEAD) {
            nextFn = ziplistNext;
            offset_update = 1;
        } else if (iter->direction == AL_START_TAIL) {
            nextFn = ziplistPrev;
            offset_update = -1;
        }
        /* NOTE(review): nextFn is still NULL here if 'direction' is neither
         * AL_START_HEAD nor AL_START_TAIL. */
        iter->zi = nextFn(iter->current->zl, iter->zi);
        iter->offset += offset_update;
    }

    entry->zi = iter->zi;
    entry->offset = iter->offset;

    if (iter->zi) {
        /* Populate value from existing ziplist position */
        ziplistGet(entry->zi, &entry->value, &entry->sz, &entry->longval);
        return 1;
    } else {
        /* We ran out of ziplist entries.
         * Pick next node, update offset, then re-run retrieval. */
        quicklistCompress(iter->quicklist, iter->current);
        if (iter->direction == AL_START_HEAD) {
            /* Forward traversal */
            D("Jumping to start of next node");
            iter->current = iter->current->next;
            iter->offset = 0;
        } else if (iter->direction == AL_START_TAIL) {
            /* Reverse traversal */
            D("Jumping to end of previous node");
            iter->current = iter->current->prev;
            iter->offset = -1;
        }
        /* Clearing zi makes the recursive call take the "first visit" path
         * above for the newly selected node (or stop if it is NULL). */
        iter->zi = NULL;
        return quicklistNext(iter, entry);
    }
}

/* Duplicate the quicklist.
 * On success a copy of the original quicklist is returned.
 *
 * The copy is created with the same 'fill' and 'compress' settings and
 * receives one new node per node of 'orig', each holding a byte-for-byte
 * copy of the source node's payload in the source node's encoding.
 *
 * The original quicklist both on success or error is never modified.
 *
 * Returns newly allocated quicklist. */
quicklist *quicklistDup(quicklist *orig) {
    quicklist *copy;
    quicklistNode *current;

    copy = quicklistNew(orig->fill, orig->compress);

    for (current = orig->head; current;
         current = current->next) {
        quicklistNode *node = quicklistCreateNode();

        /* The payload layout is dictated by the SOURCE node's encoding; the
         * freshly created node says nothing about how current->zl is
         * stored, so it must not be consulted here. */
        if (current->encoding == QUICKLIST_NODE_ENCODING_LZF) {
            /* Compressed: zl points at a quicklistLZF header followed by
             * 'sz' bytes of compressed data; copy header and data together. */
            quicklistLZF *lzf = (quicklistLZF *)current->zl;
            size_t lzf_sz = sizeof(*lzf) + lzf->sz;
            node->zl = dalloc(lzf_sz);
            memcpy(node->zl, current->zl, lzf_sz);
        } else if (current->encoding == QUICKLIST_NODE_ENCODING_RAW) {
            /* Uncompressed: zl is a plain ziplist of current->sz bytes. */
            node->zl = dalloc(current->sz);
            memcpy(node->zl, current->zl, current->sz);
        }

        node->count = current->count;
        copy->count += node->count;
        node->sz = current->sz;
        node->encoding = current->encoding;

        _quicklistInsertNodeAfter(copy, copy->tail, node);
    }

    /* copy->count must equal orig->count here */
    return copy;
}

/* Populate 'entry' with the element at the specified zero-based index
 * where 0 is the head, 1 is the element next to head
 * and so on. Negative integers are used in order to count
 * from the tail, -1 is the last element, -2 the penultimate
 * and so on. If the index is out of range 0 is returned.
 *
 * On success entry->node is the node holding the element, entry->offset is
 * the element's position inside that node (non-negative for forward
 * lookups, negative for reverse lookups), and entry->zi / value / sz /
 * longval are filled from the ziplist. The node is decompressed for use and
 * is NOT recompressed here.
 *
 * Returns 1 if element found
 * Returns 0 if element not found */
int quicklistIndex(const quicklist *quicklist, const long long idx,
                   quicklistEntry *entry) {
    quicklistNode *n;
    unsigned long long accum = 0; /* entries in the nodes skipped so far */
    unsigned long long index;     /* distance from the chosen end, 0-based */
    int forward = idx < 0 ? 0 : 1; /* < 0 -> reverse, 0+ -> forward */

    initEntry(entry);
    entry->quicklist = quicklist;

    if (!forward) {
        /* -1 -> 0, -2 -> 1, ...: distance from the tail. */
        index = (-idx) - 1;
        n = quicklist->tail;
    } else {
        index = idx;
        n = quicklist->head;
    }

    if (index >= quicklist->count)
        return 0;

    /* Walk nodes from the chosen end until the one containing 'index'. */
    while (likely(n)) {
        if ((accum + n->count) > index) {
            break;
        } else {
            D("Skipping over (%p) %u at accum %lld", (void *)n, n->count,
              accum);
            accum += n->count;
            n = forward ? n->next : n->prev;
        }
    }

    if (!n)
        return 0;

    D("Found node: %p at accum %llu, idx %llu, sub+ %llu, sub- %llu", (void *)n,
      accum, index, index - accum, (-index) - 1 + accum);

    entry->node = n;
    if (forward) {
        /* forward = normal head-to-tail offset. */
        entry->offset = index - accum;
    } else {
        /* reverse = need negative offset for tail-to-head, so undo
         * the result of the original if (index < 0) above.
         * The arithmetic is done in unsigned long long and then stored into
         * the int 'offset' field. */
        entry->offset = (-index) - 1 + accum;
    }

    quicklistDecompressNodeForUse(entry->node);
    entry->zi = ziplistIndex(entry->node->zl, entry->offset);
    ziplistGet(entry->zi, &entry->value, &entry->sz, &entry->longval);
    /* The caller will use our result, so we don't re-compress here.
     * The caller can recompress or delete the node as needed. */
    return 1;
}

/* Rotate the quicklist: the last element becomes the first one.
 * Lists with fewer than two elements are left untouched. */
void quicklistRotate(quicklist *quicklist) {
    unsigned char *tail_entry;
    unsigned char *payload;
    unsigned int payload_len;
    long long number;
    char numbuf[32] = {0};

    if (quicklist->count <= 1)
        return;

    /* Read the element currently sitting at the very end of the list. */
    tail_entry = ziplistIndex(quicklist->tail->zl, -1);
    ziplistGet(tail_entry, &payload, &payload_len, &number);

    if (!payload) {
        /* No string was returned, so the element is held in 'number';
         * render it as text so it can be pushed back like any other value. */
        payload_len = ll2string(numbuf, sizeof(numbuf), number);
        payload = (unsigned char *)numbuf;
    }

    /* Push first, delete second: 'payload' may point into the tail ziplist
     * and has to stay readable until the copy has been made. */
    quicklistPushHead(quicklist, payload, payload_len);

    /* With a single node, head and tail share one ziplist and the push may
     * have reallocated it, invalidating 'tail_entry'. Look it up again. */
    if (quicklist->len == 1) {
        tail_entry = ziplistIndex(quicklist->tail->zl, -1);
    }

    /* Finally drop the old tail element. */
    quicklistDelIndex(quicklist, quicklist->tail, &tail_entry);
}

/* Pop one element from the head or the tail of the quicklist.
 *
 * 'where' is QUICKLIST_HEAD or QUICKLIST_TAIL.
 *
 * If the element is a string, '*data' receives whatever 'saver' returns for
 * it and '*sz' receives its length. If the element is an integer, '*data'
 * is set to NULL and the number is stored in '*sval'.
 * 'data', 'sz' and 'sval' may each be NULL when the caller is not interested.
 *
 * Return value of 0 means no elements available (or 'where' is invalid).
 * Return value of 1 means check 'data' and 'sval' for values.
 * If 'data' is set, use 'data' and 'sz'.  Otherwise, use 'sval'. */
int quicklistPopCustom(quicklist *quicklist, int where, unsigned char **data,
                       unsigned int *sz, long long *sval,
                       void *(*saver)(unsigned char *data, unsigned int sz)) {
    quicklistNode *node;
    unsigned char *p;
    unsigned char *str;
    unsigned int len;
    long long num;
    int pos;

    if (quicklist->count == 0)
        return 0;

    /* Put the outputs in a known state before looking at the list. */
    if (data)
        *data = NULL;
    if (sz)
        *sz = 0;
    if (sval)
        *sval = -123456789;

    /* Select the end node and the in-node position to pop from. */
    if (where == QUICKLIST_HEAD && quicklist->head) {
        node = quicklist->head;
        pos = 0;
    } else if (where == QUICKLIST_TAIL && quicklist->tail) {
        node = quicklist->tail;
        pos = -1;
    } else {
        return 0;
    }

    p = ziplistIndex(node->zl, pos);
    if (!ziplistGet(p, &str, &len, &num))
        return 0;

    if (str) {
        /* String element: let the caller-supplied saver keep it. */
        if (data)
            *data = saver(str, len);
        if (sz)
            *sz = len;
    } else {
        /* Integer element: reported through 'sval' only. */
        if (data)
            *data = NULL;
        if (sval)
            *sval = num;
    }

    quicklistDelIndex(quicklist, node, &p);
    return 1;
}

/* Default 'saver' for quicklistPopCustom(): returns a dalloc()'d copy of the
 * 'sz' bytes at 'data', or NULL when 'data' is NULL. */
REDIS_STATIC void *_quicklistSaver(unsigned char *data, unsigned int sz) {
    unsigned char *copy;

    if (data == NULL)
        return NULL;

    copy = dalloc(sz);
    memcpy(copy, data, sz);
    return copy;
}

/* Default pop function.
 *
 * Pops from the 'where' end using quicklistPopCustom() with the default
 * saver, so a string result in '*data' is an allocated copy.
 * Each of 'data', 'sz' and 'slong' may be NULL if the caller does not need
 * that output.
 *
 * Returns 0 if the list is empty, otherwise the result of
 * quicklistPopCustom(). */
int quicklistPop(quicklist *quicklist, int where, unsigned char **data,
                 unsigned int *sz, long long *slong) {
    unsigned char *popped_str;
    unsigned int popped_len;
    long long popped_num;
    int rc;

    if (quicklist->count == 0)
        return 0;

    rc = quicklistPopCustom(quicklist, where, &popped_str, &popped_len,
                            &popped_num, _quicklistSaver);

    /* Forward only the outputs the caller asked for. */
    if (data != NULL)
        *data = popped_str;
    if (slong != NULL)
        *slong = popped_num;
    if (sz != NULL)
        *sz = popped_len;

    return rc;
}

/* Wrapper to allow argument-based switching between HEAD/TAIL push.
 * 'where' is QUICKLIST_HEAD or QUICKLIST_TAIL; any other value pushes
 * nothing. */
void quicklistPush(quicklist *quicklist, void *value, const size_t sz,
                   int where) {
    switch (where) {
    case QUICKLIST_HEAD:
        quicklistPushHead(quicklist, value, sz);
        break;
    case QUICKLIST_TAIL:
        quicklistPushTail(quicklist, value, sz);
        break;
    default:
        /* Unknown end: silently ignored. */
        break;
    }
}


================================================
FILE: src/vr_quicklist.h
================================================
#ifndef _VR_QUICKLIST_H_
#define _VR_QUICKLIST_H_

/* Node, quicklist, and Iterator are the only data structures used currently. */

/* quicklistNode is a 32 byte struct (with 8-byte pointers) describing a
 * ziplist for a quicklist.
 * We use bit fields to keep the quicklistNode at 32 bytes.
 * count: 16 bits, max 65535 (max zl bytes is 65k, so max count actually < 32k).
 * encoding: 2 bits, RAW=1, LZF=2.
 * container: 2 bits, NONE=1, ZIPLIST=2.
 * recompress: 1 bit, bool, true if node is temporarily decompressed for usage.
 * attempted_compress: 1 bit, boolean, used for verifying during testing.
 * extra: 10 bits, free for future use; pads out the remainder of 32 bits */
typedef struct quicklistNode {
    struct quicklistNode *prev;
    struct quicklistNode *next;
    unsigned char *zl;           /* ziplist, or a quicklistLZF if compressed */
    unsigned int sz;             /* ziplist size in bytes (uncompressed) */
    unsigned int count : 16;     /* count of items in ziplist */
    unsigned int encoding : 2;   /* RAW==1 or LZF==2 */
    unsigned int container : 2;  /* NONE==1 or ZIPLIST==2 */
    unsigned int recompress : 1; /* was this node previous compressed? */
    unsigned int attempted_compress : 1; /* node can't compress; too small */
    unsigned int extra : 10; /* more bits to steal for future usage */
} quicklistNode;

/* quicklistLZF is a 4+N byte struct holding 'sz' followed by 'compressed'.
 * 'sz' is byte length of 'compressed' field.
 * 'compressed' is LZF data with total (compressed) length 'sz'
 * NOTE: uncompressed length is stored in quicklistNode->sz.
 * When quicklistNode->zl is compressed, node->zl points to a quicklistLZF.
 * The total allocation for one instance is sizeof(quicklistLZF) + sz. */
typedef struct quicklistLZF {
    unsigned int sz; /* LZF size in bytes*/
    char compressed[]; /* flexible array member: 'sz' bytes of LZF data */
} quicklistLZF;

/* quicklist is a 32 byte struct (on 64-bit systems) describing a quicklist.
 * 'count' is the number of total entries.
 * 'len' is the number of quicklist nodes.
 * 'compress' is: 0 (QUICKLIST_NOCOMPRESS) if compression disabled, otherwise
 *                it's the number of quicklistNodes to leave uncompressed at
 *                ends of quicklist. The field is unsigned, so it cannot
 *                hold a negative "disabled" marker.
 * 'fill' is the user-requested (or default) fill factor. */
typedef struct quicklist {
    quicklistNode *head;
    quicklistNode *tail;
    unsigned long count;        /* total count of all entries in all ziplists */
    unsigned int len;           /* number of quicklistNodes */
    int fill : 16;              /* fill factor for individual nodes */
    unsigned int compress : 16; /* depth of end nodes not to compress;0=off */
} quicklist;

/* Iteration state over a quicklist. Created by quicklistGetIterator() or
 * quicklistGetIteratorAtIdx(), advanced by quicklistNext() and destroyed by
 * quicklistReleaseIterator(). */
typedef struct quicklistIter {
    const quicklist *quicklist; /* list being iterated */
    quicklistNode *current;     /* node being visited; NULL once exhausted */
    unsigned char *zi;          /* position in current ziplist; NULL until
                                 * resolved from 'offset' */
    long offset; /* offset in current ziplist */
    int direction;              /* AL_START_HEAD or AL_START_TAIL */
} quicklistIter;

/* One element of a quicklist as reported by quicklistIndex() and
 * quicklistNext(). When 'value' is non-NULL the element is a string of 'sz'
 * bytes; otherwise the element is the integer in 'longval'. */
typedef struct quicklistEntry {
    const quicklist *quicklist; /* list the element belongs to */
    quicklistNode *node;        /* node holding the element */
    unsigned char *zi;          /* element position inside node's ziplist */
    unsigned char *value;       /* string payload, or NULL for integers */
    unsigned int sz;            /* length of 'value' in bytes */
    long long longval;          /* integer payload when 'value' is NULL */
    int offset;                 /* element offset within 'node'; negative
                                 * values count from the node's end */
} quicklistEntry;

/* List ends, used as the 'where' argument of the push/pop functions. */
#define QUICKLIST_HEAD 0
#define QUICKLIST_TAIL -1

/* quicklist node encodings (values of quicklistNode.encoding) */
#define QUICKLIST_NODE_ENCODING_RAW 1
#define QUICKLIST_NODE_ENCODING_LZF 2

/* quicklist compression disable (value of quicklist.compress) */
#define QUICKLIST_NOCOMPRESS 0

/* quicklist container formats (values of quicklistNode.container) */
#define QUICKLIST_NODE_CONTAINER_NONE 1
#define QUICKLIST_NODE_CONTAINER_ZIPLIST 2

/* True when the node's payload is currently stored LZF-compressed. */
#define quicklistNodeIsCompressed(node)                                        \
    ((node)->encoding == QUICKLIST_NODE_ENCODING_LZF)

/* Prototypes */
quicklist *quicklistCreate(void);
quicklist *quicklistNew(int fill, int compress);
void quicklistSetCompressDepth(quicklist *quicklist, int depth);
void quicklistSetFill(quicklist *quicklist, int fill);
void quicklistSetOptions(quicklist *quicklist, int fill, int depth);
void quicklistRelease(quicklist *quicklist);
int quicklistPushHead(quicklist *quicklist, void *value, const size_t sz);
int quicklistPushTail(quicklist *quicklist, void *value, const size_t sz);
void quicklistPush(quicklist *quicklist, void *value, const size_t sz,
                   int where);
void quicklistAppendZiplist(quicklist *quicklist, unsigned char *zl);
quicklist *quicklistAppendValuesFromZiplist(quicklist *quicklist,
                                            unsigned char *zl);
quicklist *quicklistCreateFromZiplist(int fill, int compress,
                                      unsigned char *zl);
void quicklistInsertAfter(quicklist *quicklist, quicklistEntry *node,
                          void *value, const size_t sz);
void quicklistInsertBefore(quicklist *quicklist, quicklistEntry *node,
                           void *value, const size_t sz);
void quicklistDelEntry(quicklistIter *iter, quicklistEntry *entry);
int quicklistReplaceAtIndex(quicklist *quicklist, long index, void *data,
                            int sz);
/* Delete up to 'count' entries beginning at index 'start'.
 * The third argument is a length, not an end index. */
int quicklistDelRange(quicklist *quicklist, const long start,
                      const long count);
quicklistIter *quicklistGetIterator(const quicklist *quicklist, int direction);
quicklistIter *quicklistGetIteratorAtIdx(const quicklist *quicklist,
                                         int direction, const long long idx);
int quicklistNext(quicklistIter *iter, quicklistEntry *node);
void quicklistReleaseIterator(quicklistIter *iter);
quicklist *quicklistDup(quicklist *orig);
int quicklistIndex(const quicklist *quicklist, const long long index,
                   quicklistEntry *entry);
void quicklistRewind(quicklist *quicklist, quicklistIter *li);
void quicklistRewindTail(quicklist *quicklist, quicklistIter *li);
void quicklistRotate(quicklist *quicklist);
int quicklistPopCustom(quicklist *quicklist, int where, unsigned char **data,
                       unsigned int *sz, long long *sval,
                       void *(*saver)(unsigned char *data, unsigned int sz));
int quicklistPop(quicklist *quicklist, int where, unsigned char **data,
                 unsigned int *sz, long long *slong);
unsigned int quicklistCount(quicklist *ql);
int quicklistCompare(unsigned char *p1, unsigned char *p2, int p2_len);
size_t quicklistGetLzf(const quicklistNode *node, void **data);

/* Directions for iterators, as passed to quicklistGetIterator():
 * AL_START_HEAD begins at the head node and moves towards the tail,
 * AL_START_TAIL begins at the tail node and moves towards the head. */
#define AL_START_HEAD 0
#define AL_START_TAIL 1

#endif /* _VR_QUICKLIST_H_ */


================================================
FILE: src/vr_rbtree.c
================================================
#include <vr_core.h>

/* Reset a node to a detached, empty state: no links, zero key, no data. */
void
rbtree_node_init(struct rbnode *node)
{
    /* payload */
    node->key = 0ULL;
    node->data = NULL;

    /* tree links */
    node->parent = NULL;
    node->left = NULL;
    node->right = NULL;

    /* the color field is intentionally not written here */
}

/* Initialize an empty tree. 'node' becomes the tree's black sentinel, and
 * an empty tree is represented by root == sentinel. */
void
rbtree_init(struct rbtree *tree, struct rbnode *node)
{
    struct rbnode *nil = node;

    rbtree_node_init(nil);
    rbtree_black(nil);

    tree->sentinel = nil;
    tree->root = nil;
}

/* Return the leftmost node of the subtree rooted at 'node'. */
static struct rbnode *
rbtree_node_min(struct rbnode *node, struct rbnode *sentinel)
{
    struct rbnode *leftmost;

    for (leftmost = node; leftmost->left != sentinel;
         leftmost = leftmost->left) {
        /* keep following left links */
    }

    return leftmost;
}

/* Return the node with the smallest key, or NULL if the tree is empty. */
struct rbnode *
rbtree_min(struct rbtree *tree)
{
    /* an empty tree has the sentinel as its root */
    if (tree->root == tree->sentinel) {
        return NULL;
    }

    return rbtree_node_min(tree->root, tree->sentinel);
}

/* Left rotation around 'node': its right child ("pivot") takes node's place
 * and 'node' becomes the pivot's left child. '*root' is updated when 'node'
 * was the root. */
static void
rbtree_left_rotate(struct rbnode **root, struct rbnode *sentinel,
                   struct rbnode *node)
{
    struct rbnode *pivot = node->right;
    struct rbnode *inner = pivot->left;   /* subtree that changes sides */
    struct rbnode *parent = node->parent;

    /* pivot's left subtree becomes node's right subtree */
    node->right = inner;
    if (inner != sentinel) {
        inner->parent = node;
    }

    /* hook pivot into node's former position */
    pivot->parent = parent;
    if (node == *root) {
        *root = pivot;
    } else if (parent->left == node) {
        parent->left = pivot;
    } else {
        parent->right = pivot;
    }

    /* node goes below pivot */
    pivot->left = node;
    node->parent = pivot;
}

/* Right rotation around 'node': its left child ("pivot") takes node's place
 * and 'node' becomes the pivot's right child. '*root' is updated when
 * 'node' was the root. */
static void
rbtree_right_rotate(struct rbnode **root, struct rbnode *sentinel,
                    struct rbnode *node)
{
    struct rbnode *pivot = node->left;
    struct rbnode *inner = pivot->right;  /* subtree that changes sides */
    struct rbnode *parent = node->parent;

    /* pivot's right subtree becomes node's left subtree */
    node->left = inner;
    if (inner != sentinel) {
        inner->parent = node;
    }

    /* hook pivot into node's former position */
    pivot->parent = parent;
    if (node == *root) {
        *root = pivot;
    } else if (parent->right == node) {
        parent->right = pivot;
    } else {
        parent->left = pivot;
    }

    /* node goes below pivot */
    pivot->right = node;
    node->parent = pivot;
}

/* Insert 'node' into 'tree', ordered by node->key, then restore the
 * red-black coloring. The caller sets node->key (and data) beforehand; the
 * node's links and color are overwritten here. Keys that compare equal are
 * placed in the right subtree. */
void
rbtree_insert(struct rbtree *tree, struct rbnode *node)
{
    struct rbnode **root = &tree->root;
    struct rbnode *sentinel = tree->sentinel;
    struct rbnode *temp, **p;

    /* empty tree: the new node becomes a black root */

    if (*root == sentinel) {
        node->parent = NULL;
        node->left = sentinel;
        node->right = sentinel;
        rbtree_black(node);
        *root = node;
        return;
    }

    /* a binary tree insert: descend to the sentinel slot for this key */

    temp = *root;
    for (;;) {

        p = (node->key < temp->key) ? &temp->left : &temp->right;
        if (*p == sentinel) {
            break;
        }
        temp = *p;
    }

    /* link the node in as a red leaf below 'temp' */
    *p = node;
    node->parent = temp;
    node->left = sentinel;
    node->right = sentinel;
    rbtree_red(node);

    /* re-balance tree: loop while 'node' is red and has a red parent */

    while (node != *root && rbtree_is_red(node->parent)) {

        if (node->parent == node->parent->parent->left) {
            /* parent is a left child; 'temp' is the uncle */
            temp = node->parent->parent->right;

            if (rbtree_is_red(temp)) {
                /* red uncle: recolor and continue from the grandparent */
                rbtree_black(node->parent);
                rbtree_black(temp);
                rbtree_red(node->parent->parent);
                node = node->parent->parent;
            } else {
                /* black uncle: rotate (once or twice) and recolor */
                if (node == node->parent->right) {
                    node = node->parent;
                    rbtree_left_rotate(root, sentinel, node);
                }

                rbtree_black(node->parent);
                rbtree_red(node->parent->parent);
                rbtree_right_rotate(root, sentinel, node->parent->parent);
            }
        } else {
            /* mirror image: parent is a right child */
            temp = node->parent->parent->left;

            if (rbtree_is_red(temp)) {
                rbtree_black(node->parent);
                rbtree_black(temp);
                rbtree_red(node->parent->parent);
                node = node->parent->parent;
            } else {
                if (node == node->parent->left) {
                    node = node->parent;
                    rbtree_right_rotate(root, sentinel, node);
                }

                rbtree_black(node->parent);
                rbtree_red(node->parent->parent);
                rbtree_left_rotate(root, sentinel, node->parent->parent);
            }
        }
    }

    /* the root is always black */
    rbtree_black(*root);
}

/* Remove 'node' from 'tree' and restore the red-black coloring.
 * On return 'node' has been reset with rbtree_node_init() (links, key and
 * data cleared), so the caller must not rely on those fields afterwards.
 *
 * Locals:
 *   subst - the node that is physically unlinked: 'node' itself when it
 *           has at most one child, otherwise the minimum of its right
 *           subtree, which then takes node's place;
 *   temp  - the child that moves into subst's old position (may be the
 *           sentinel);
 *   w     - temp's sibling during the fixup loop. */
void
rbtree_delete(struct rbtree *tree, struct rbnode *node)
{
    struct rbnode **root = &tree->root;
    struct rbnode *sentinel = tree->sentinel;
    struct rbnode *subst, *temp, *w;
    uint8_t red;

    /* a binary tree delete */

    if (node->left == sentinel) {
        temp = node->right;
        subst = node;
    } else if (node->right == sentinel) {
        temp = node->left;
        subst = node;
    } else {
        subst = rbtree_node_min(node->right, sentinel);
        temp = subst->right;
    }

    /* removing the root while it has at most one child: the child (or the
     * sentinel) simply becomes the new black root */
    if (subst == *root) {
        *root = temp;
        rbtree_black(temp);

        rbtree_node_init(node);

        return;
    }

    /* remember subst's color before its fields are overwritten below */
    red = rbtree_is_red(subst);

    /* unlink subst from its parent, putting temp in its place */
    if (subst == subst->parent->left) {
        subst->parent->left = temp;
    } else {
        subst->parent->right = temp;
    }

    if (subst == node) {
        temp->parent = subst->parent;
    } else {

        /* temp's parent may be written even when temp is the sentinel; the
         * fixup loop below reads temp->parent */
        if (subst->parent == node) {
            temp->parent = subst;
        } else {
            temp->parent = subst->parent;
        }

        /* subst takes over node's links and color */
        subst->left = node->left;
        subst->right = node->right;
        subst->parent = node->parent;
        rbtree_copy_color(subst, node);

        if (node == *root) {
            *root = subst;
        } else {
            if (node == node->parent->left) {
                node->parent->left = subst;
            } else {
                node->parent->right = subst;
            }
        }

        if (subst->left != sentinel) {
            subst->left->parent = subst;
        }

        if (subst->right != sentinel) {
            subst->right->parent = subst;
        }
    }

    rbtree_node_init(node);

    /* unlinking a red node cannot break the black-height invariant */
    if (red) {
        return;
    }

    /* a delete fixup */

    while (temp != *root && rbtree_is_black(temp)) {

        if (temp == temp->parent->left) {
            w = temp->parent->right;

            /* red sibling: rotate so that the sibling becomes black */
            if (rbtree_is_red(w)) {
                rbtree_black(w);
                rbtree_red(temp->parent);
                rbtree_left_rotate(root, sentinel, temp->parent);
                w = temp->parent->right;
            }

            if (rbtree_is_black(w->left) && rbtree_is_black(w->right)) {
                /* both of the sibling's children are black: recolor and
                 * continue one level up */
                rbtree_red(w);
                temp = temp->parent;
            } else {
                if (rbtree_is_black(w->right)) {
                    rbtree_black(w->left);
                    rbtree_red(w);
                    rbtree_right_rotate(root, sentinel, w);
                    w = temp->parent->right;
                }

                rbtree_copy_color(w, temp->parent);
                rbtree_black(temp->parent);
                rbtree_black(w->right);
                rbtree_left_rotate(root, sentinel, temp->parent);
                /* done: setting temp to the root ends the loop */
                temp = *root;
            }

        } else {
            /* mirror image: temp is a right child */
            w = temp->parent->left;

            if (rbtree_is_red(w)) {
                rbtree_black(w);
                rbtree_red(temp->parent);
                rbtree_right_rotate(root, sentinel, temp->parent);
                w = temp->parent->left;
            }

            if (rbtree_is_black(w->left) && rbtree_is_black(w->right)) {
                rbtree_red(w);
                temp = temp->parent;
            } else {
                if (rbtree_is_black(w->left)) {
                    rbtree_black(w->right);
                    rbtree_red(w);
                    rbtree_left_rotate(root, sentinel, w);
                    w = temp->parent->left;
                }

                rbtree_copy_color(w, temp->parent);
                rbtree_black(temp->parent);
                rbtree_black(w->left);
                rbtree_right_rotate(root, sentinel, temp->parent);
                temp = *root;
            }
        }
    }

    rbtree_black(temp);
}


================================================
FILE: src/vr_rbtree.h
================================================
#ifndef _VR_RBTREE_
#define _VR_RBTREE_

/* Node color helpers: color 1 is red, color 0 is black. */
#define rbtree_red(_node)           ((_node)->color = 1)
#define rbtree_black(_node)         ((_node)->color = 0)
#define rbtree_is_red(_node)        ((_node)->color)
#define rbtree_is_black(_node)      (!rbtree_is_red(_node))
/* Copy the color of _n2 into _n1. */
#define rbtree_copy_color(_n1, _n2) ((_n1)->color = (_n2)->color)

/* A red-black tree node. The caller sets 'key' (and 'data') before
 * rbtree_insert(); rbtree_delete() clears links, key and data again. */
struct rbnode {
    struct rbnode *left;     /* left link */
    struct rbnode *right;    /* right link */
    struct rbnode *parent;   /* parent link */
    int64_t       key;       /* key for ordering */
    void          *data;     /* opaque data */
    uint8_t       color;     /* red | black (1 = red, 0 = black) */
};

/* A red-black tree. The tree is empty when root == sentinel; leaf links
 * point at the sentinel rather than at NULL. */
struct rbtree {
    struct rbnode *root;     /* root node */
    struct rbnode *sentinel; /* nil node */
};

void rbtree_node_init(struct rbnode *node);
void rbtree_init(struct rbtree *tree, struct rbnode *node);
struct rbnode *rbtree_min(struct rbtree *tree);
void rbtree_insert(struct rbtree *tree, struct rbnode *node);
void rbtree_delete(struct rbtree *tree, struct rbnode *node);

#endif


================================================
FILE: src/vr_rdb.c
================================================
#include <vr_core.h>

/* Save the DB on disk.
 * Currently a stub: nothing is written, 'filename' is ignored and VR_OK is
 * always returned. */
int rdbSave(char *filename) {
    return VR_OK;
}

/* Remove the temporary dump file "temp-<childpid>.rdb" from the current
 * working directory. The result of unlink() is not checked. */
void rdbRemoveTempFile(pid_t childpid) {
    char path[256];
    int pid = (int) childpid;

    snprintf(path, sizeof(path), "temp-%d.rdb", pid);
    unlink(path);
}


================================================
FILE: src/vr_rdb.h
================================================
#ifndef _VR_RDB_H_
#define _VR_RDB_H_

/* Defines related to the dump file format. To store 32 bits lengths for short
 * keys requires a lot of space, so we check the most significant 2 bits of
 * the first byte to interpret the length:
 *
 * 00|000000 => if the two MSB are 00 the len is the 6 bits of this byte
 * 01|000000 00000000 =>  01, the len is 14 bits, 6 bits + 8 bits of next byte
 * 10|000000 [32 bit integer] => if it's 10, a full 32 bit len will follow
 * 11|000000 this means: specially encoded object will follow. The six bits
 *           number specify the kind of object that follows.
 *           See the RDB_ENC_* defines.
 *
 * Lengths up to 63 are stored using a single byte, most DB keys, and many
 * values, will fit inside. */
#define RDB_6BITLEN 0
#define RDB_14BITLEN 1
#define RDB_32BITLEN 2
#define RDB_ENCVAL 3
/* NOTE(review): presumably the value reported when a length cannot be
 * read -- confirm against the users of this constant. */
#define RDB_LENERR UINT_MAX

/* When a length of a string object stored on disk has the first two bits
 * set, the remaining six bits specify a special encoding for the object
 * accordingly to the following defines: */
#define RDB_ENC_INT8 0        /* 8 bit signed integer */
#define RDB_ENC_INT16 1       /* 16 bit signed integer */
#define RDB_ENC_INT32 2       /* 32 bit signed integer */
#define RDB_ENC_LZF 3         /* string compressed with FASTLZ */

/* One save-point setting: a time interval paired with a change count.
 * NOTE(review): presumably "save after 'seconds' seconds if at least
 * 'changes' changes happened" -- confirm against the code that reads it. */
struct saveparam {
    time_t seconds;
    int changes;
};

int rdbSave(char *filename);
void rdbRemoveTempFile(pid_t childpid);

#endif


================================================
FILE: src/vr_replication.c
================================================
#include <vr_core.h>

struct vr_replication repl;

/* Initialize the global replication state 'repl'.
 *
 * The instance starts as a master with no replication link, an unallocated
 * backlog configured with the default size and time limit, and an empty
 * list of slaves. Always returns VR_OK.
 *
 * NOTE(review): the results of vr_eventloop_init() and dlistCreate() are
 * not checked here. */
int vr_replication_init(void)
{
    vr_eventloop_init(&repl.vel,1000);

    /* Role and state of the link with a master. */
    repl.role = REPLICATION_ROLE_MASTER;
    repl.repl_state = REPL_STATE_NONE;
    repl.repl_down_since = 0;
    repl.master = NULL;
    repl.cached_master = NULL;

    /* min-slaves-to-write bookkeeping (all zero at startup). */
    repl.repl_min_slaves_to_write = 0;
    repl.repl_min_slaves_max_lag = 0;
    repl.repl_good_slaves_count = 0;

    /* Replication partial resync backlog: no buffer yet, default limits. */
    repl.repl_backlog = NULL;
    repl.repl_backlog_size = CONFIG_DEFAULT_REPL_BACKLOG_SIZE;
    repl.repl_backlog_time_limit = CONFIG_DEFAULT_REPL_BACKLOG_TIME_LIMIT;
    repl.repl_backlog_histlen = 0;
    repl.repl_backlog_idx = 0;
    repl.repl_backlog_off = 0;

    /* There are no slaves as of right now. */
    repl.repl_no_slaves_since = time(NULL);
    repl.slaves = dlistCreate();

    return VR_OK;
}

/* Tear down the global replication state 'repl': deinitialize its event
 * loop, free the master and cached master clients, free the backlog buffer,
 * and free every slave client before releasing the slaves list. Each
 * released pointer is reset to NULL. */
void vr_replication_deinit(void)
{
    client *slave;

    vr_eventloop_deinit(&repl.vel);

    if (repl.master != NULL) {
        freeClient(repl.master);
        repl.master = NULL;
    }

    if (repl.cached_master != NULL) {
        freeClient(repl.cached_master);
        repl.cached_master = NULL;
    }

    if (repl.repl_backlog != NULL) {
        dfree(repl.repl_backlog);
        repl.repl_backlog = NULL;
    }

    /* Nothing else to do when the list was never created. */
    if (repl.slaves == NULL) return;

    /* Drain the list, freeing every slave client that is popped. */
    while ((slave = dlistPop(repl.slaves)) != NULL)
        freeClient(slave);

    dlistRelease(repl.slaves);
    repl.slaves = NULL;
}

/* Blocking-operation specific cleanup for clients waiting for replica acks:
 * the client is removed from the clients_waiting_acks list of its event
 * loop. The client must be in that list (asserted).
 *
 * Never call this directly, call unblockClient() instead. */
void unblockClientWaitingReplicas(client *c) {
    dlist *waiting = c->vel->clients_waiting_acks;
    dlistNode *node;

    node = dlistSearchKey(waiting,c);
    ASSERT(node != NULL);
    dlistDelNode(waiting,node);
}

/* ------------------------- MIN-SLAVES-TO-WRITE  --------------------------- */

/* Recompute repl.repl_good_slaves_count, i.e. the number of slaves that are
 * ONLINE and whose last ack is at most repl_min_slaves_max_lag seconds old
 * (measured against repl.vel.unixtime).
 *
 * When either repl_min_slaves_to_write or repl_min_slaves_max_lag is zero
 * the feature is off and the counter is left untouched. */
void refreshGoodSlavesCount(void) {
    dlistIter iter;
    dlistNode *node;
    int count = 0;

    if (repl.repl_min_slaves_to_write == 0 ||
        repl.repl_min_slaves_max_lag == 0)
        return;

    dlistRewind(repl.slaves,&iter);
    for (node = dlistNext(&iter); node != NULL; node = dlistNext(&iter)) {
        client *slave = node->value;
        time_t lag;

        if (slave->replstate != SLAVE_STATE_ONLINE) continue;

        lag = repl.vel.unixtime - slave->repl_ack_time;
        if (lag <= repl.repl_min_slaves_max_lag) count++;
    }
    repl.repl_good_slaves_count = count;
}

/* Called when the slave loses the connection with its master in an
 * unexpected way: forget the master client, record when the link went down
 * and go back to the "must connect" state.
 *
 * Slaves are deliberately not disconnected here: a later PSYNC with the
 * master may still succeed. They are dropped only when a full resync with
 * the master is required. */
void replicationHandleMasterDisconnection(void) {
    repl.repl_down_since = repl.vel.unixtime;
    repl.repl_state = REPL_STATE_CONNECT;
    repl.master = NULL;
}


/* ---------------------- MASTER CACHING FOR PSYNC -------------------------- */

/* In order to implement partial synchronization we need to be able to cache
 * our master's client structure after a transient disconnection.
 * It is cached into server.cached_master and flushed away using the following
 * functions. */

/* Called by freeClient() to cache the master client structure instead of
 * destroying it. freeClient() returns right after this function, so every
 * step needed to keep a "suspended" client harmless must happen here.
 *
 * Requires a current master and no cached master already (asserted).
 *
 * Other functions dealing with the cached master:
 *
 * replicationDiscardCachedMaster() kills the cached client when it is not
 * going to be reused.
 *
 * replicationResurrectCachedMaster() reactivates the cached master after a
 * successful PSYNC handshake.
 */
void replicationCacheMaster(client *c) {
    ASSERT(repl.master != NULL && repl.cached_master == NULL);
    log_debug(LOG_NOTICE,"Caching the disconnected master state.");

    /* Detach the client from the server structures. */
    unlinkClient(c);

    /* Keep a reference to the master; repl.master itself is cleared below
     * by replicationHandleMasterDisconnection(). */
    repl.cached_master = repl.master;

    /* Drop the cached Peer ID string, if any. */
    if (c->peerid != NULL) {
        sdsfree(c->peerid);
        c->peerid = NULL;
    }

    /* Caching replaces the real freeClient() work, so the replication
     * state must be adjusted here; this also sets repl.master to NULL. */
    replicationHandleMasterDisconnection();
}

/* Return a pointer to a string naming the slave, meant for log messages
 * such as "Closing connection with slave 10.1.2.3:6380".
 *
 * Placeholder implementation: the ip:listening_port pair is not built yet,
 * so 'c' is ignored and the returned string is always empty.
 *
 * The result lives in a static buffer: it must not be freed by the caller
 * and is shared by all calls to this function. */
char *replicationGetSlaveName(client *c) {
    static char buf[VR_INET_PEER_ID_LEN];

    (void)c;
    buf[0] = '\0';

    return buf;
}

/* REPLCONF <option> <value> <option> <value> ...
 *
 * Options handled, matched case-insensitively:
 *
 *   listening-port <port>  store the port in c->slave_listening_port.
 *   capa <name>            "eof" sets SLAVE_CAPA_EOF, anything else is
 *                          silently ignored.
 *   ack <offset>           record the replication offset acknowledged by a
 *                          slave; never replies and stops processing.
 *   getack <arg>           ask for an ACK to be sent to our master.
 *
 * An even argument count yields a syntax error, an unknown option yields an
 * error naming the option. Otherwise, unless an "ack" option or a failed
 * parse returned early, the reply is +OK. */
void replconfCommand(client *c) {
    int idx;

    /* argv[0] plus option/value pairs: the total must be odd. */
    if (c->argc % 2 == 0) {
        addReply(c,shared.syntaxerr);
        return;
    }

    /* Walk the option/value pairs. */
    for (idx = 1; idx < c->argc; idx += 2) {
        char *option = c->argv[idx]->ptr;
        robj *value = c->argv[idx+1];

        if (strcasecmp(option,"listening-port") == 0) {
            long port;

            if (getLongFromObjectOrReply(c,value,&port,NULL) != VR_OK)
                return;
            c->slave_listening_port = port;
        } else if (strcasecmp(option,"capa") == 0) {
            /* Capabilities this master does not know are ignored. */
            if (strcasecmp(value->ptr,"eof") == 0)
                c->slave_capa |= SLAVE_CAPA_EOF;
        } else if (strcasecmp(option,"ack") == 0) {
            /* REPLCONF ACK: the slave reports how much of the replication
             * stream it processed. Internal use only, so it is ignored
             * for clients that are not slaves. */
            long long offset;

            if ((c->flags & CLIENT_SLAVE) == 0) return;
            if (getLongLongFromObject(value,&offset) != VR_OK) return;

            /* The acknowledged offset never moves backwards. */
            if (offset > c->repl_ack_off) c->repl_ack_off = offset;
            c->repl_ack_time = c->vel->unixtime;

            /* A slave flagged with repl_put_online_on_ack is really put
             * online only when its first ACK is received. */
            if (c->repl_put_online_on_ack && c->replstate == SLAVE_STATE_ONLINE)
                putSlaveOnline(c);

            /* Note: this command does not reply anything! */
            return;
        } else if (strcasecmp(option,"getack") == 0) {
            /* REPLCONF GETACK: send an ACK to our master ASAP, provided
             * that we have one. */
            if (repl.masterhost && repl.master) replicationSendAck();
            /* Note: this command does not reply anything! */
        } else {
            addReplyErrorFormat(c,"Unrecognized REPLCONF option: %s",
                option);
            return;
        }
    }
    addReply(c,shared.ok);
}

/* Put a slave in the online state, once it is ready to receive the
 * incremental stream of commands.
 *
 * Steps:
 *
 * 1) Mark the slave ONLINE and clear repl_put_online_on_ack (the state may
 *    already be ONLINE when the function is called because of that flag).
 * 2) Refresh the ack time so the slave is not considered timed out.
 * 3) Install the writable event for the slave socket; on failure a warning
 *    is logged, the slave is freed and nothing else is done.
 * 4) Refresh the count of good slaves and log the successful sync. */
void putSlaveOnline(client *slave) {
    int rc;

    slave->repl_put_online_on_ack = 0;
    slave->replstate = SLAVE_STATE_ONLINE;
    slave->repl_ack_time = slave->vel->unixtime; /* Prevent false timeout. */

    rc = aeCreateFileEvent(slave->vel->el, slave->conn->sd, AE_WRITABLE,
        sendReplyToClient, slave);
    if (rc == AE_ERR) {
        log_warn("unable to register writable event for slave bulk transfer: %s", strerror(errno));
        freeClient(slave);
        return;
    }

    refreshGoodSlavesCount();
    log_debug(LOG_NOTICE,"Synchronization with slave %s succeeded",
        replicationGetSlaveName(slave));
}

/* Send "REPLCONF ACK <reploff>" to the master, reporting the offset stored
 * in the master client. Does nothing when there is no master.
 *
 * CLIENT_MASTER_FORCE_REPLY is set only while the three-element reply is
 * queued and cleared right after. */
void replicationSendAck(void) {
    client *master = repl.master;

    if (master == NULL) return;

    master->flags |= CLIENT_MASTER_FORCE_REPLY;
    addReplyMultiBulkLen(master,3);
    addReplyBulkCString(master,"REPLCONF");
    addReplyBulkCString(master,"ACK");
    addReplyBulkLongLong(master,master->reploff);
    master->flags &= ~CLIENT_MASTER_FORCE_REPLY;
}

/* Send a textual representation of a command to every client in 'monitors'.
 *
 * The line has the form:
 *
 *   +<sec>.<usec> [<dictid> <origin>] <arg> <arg> ...\r\n
 *
 * where <origin> is "lua" for CLIENT_LUA clients, "unix:<socket path>" for
 * CLIENT_UNIX_SOCKET clients and the peer id of 'c' otherwise. Integer
 * encoded arguments are printed as quoted numbers, all the others through
 * sdscatrepr(). The line is built once and shared by all the monitors. */
void replicationFeedMonitors(client *c, dlist *monitors, int dictid, robj **argv, int argc) {
    dlistIter iter;
    dlistNode *node;
    struct timeval now;
    robj *line;
    sds repr;
    int i;

    repr = sdsnew("+");
    gettimeofday(&now,NULL);
    repr = sdscatprintf(repr,"%ld.%06ld ",(long)now.tv_sec,(long)now.tv_usec);

    /* Origin of the command. */
    if (c->flags & CLIENT_LUA) {
        repr = sdscatprintf(repr,"[%d lua] ",dictid);
    } else if (c->flags & CLIENT_UNIX_SOCKET) {
        repr = sdscatprintf(repr,"[%d unix:%s] ",dictid,server.unixsocket);
    } else {
        repr = sdscatprintf(repr,"[%d %s] ",dictid,getClientPeerId(c));
    }

    /* Arguments, separated by a single space. */
    for (i = 0; i < argc; i++) {
        robj *arg = argv[i];

        if (i > 0)
            repr = sdscatlen(repr," ",1);

        if (arg->encoding == OBJ_ENCODING_INT) {
            repr = sdscatprintf(repr, "\"%ld\"", (long)arg->ptr);
        } else {
            repr = sdscatrepr(repr,(char*)arg->ptr,
                        sdslen(arg->ptr));
        }
    }
    repr = sdscatlen(repr,"\r\n",2);
    line = createObject(OBJ_STRING,repr);

    /* Deliver the same object to every monitor, then drop our reference. */
    dlistRewind(monitors,&iter);
    for (node = dlistNext(&iter); node != NULL; node = dlistNext(&iter)) {
        client *monitor = node->value;
        addReply(monitor,line);
    }
    decrRefCount(line);
}

/* Append 'len' bytes starting at 'ptr' to the replication backlog.
 *
 * repl.master_repl_offset is advanced by 'len' as well, since the backlog
 * is never fed without moving the global replication offset.
 *
 * The backlog is a circular buffer of repl_backlog_size bytes: data is
 * copied in chunks up to the end of the buffer and the write index wraps
 * to zero when the end is reached. The history length is capped at the
 * buffer size, and repl_backlog_off is updated to the replication offset
 * of the first byte still held in the backlog. */
void feedReplicationBacklog(void *ptr, size_t len) {
    unsigned char *src = ptr;

    repl.master_repl_offset += len;

    while (len > 0) {
        /* Room left before the end of the buffer, limited to what is
         * still to be written. */
        size_t room = repl.repl_backlog_size - repl.repl_backlog_idx;
        size_t chunk = (room > len) ? len : room;

        memcpy(repl.repl_backlog+repl.repl_backlog_idx,src,chunk);

        repl.repl_backlog_idx += chunk;
        if (repl.repl_backlog_idx == repl.repl_backlog_size)
            repl.repl_backlog_idx = 0;

        repl.repl_backlog_histlen += chunk;
        src += chunk;
        len -= chunk;
    }

    if (repl.repl_backlog_histlen > repl.repl_backlog_size)
        repl.repl_backlog_histlen = repl.repl_backlog_size;

    /* Set the offset of the first byte we have in the backlog. */
    repl.repl_backlog_off = repl.master_repl_offset -
                              repl.repl_backlog_histlen + 1;
}

/* Feed the replication backlog with the content of a string object.
 * Integer encoded objects are first converted to their decimal string
 * representation; for any other encoding o->ptr is fed as an sds string. */
void feedReplicationBacklogWithObject(robj *o) {
    char numbuf[LONG_STR_SIZE];
    size_t numlen;

    if (o->encoding != OBJ_ENCODING_INT) {
        feedReplicationBacklog(o->ptr,sdslen(o->ptr));
        return;
    }

    numlen = ll2string(numbuf,sizeof(numbuf),(long)o->ptr);
    feedReplicationBacklog(numbuf,numlen);
}

/* Propagate a command to the replication backlog and to the slaves in the
 * 'slaves' list.
 *
 * slaves: list of slave clients to feed.
 * dictid: id of the DB the command was executed against.
 * argv:   command arguments, as string objects.
 * argc:   number of elements in argv.
 *
 * When 'dictid' differs from the last DB selected in the replication
 * output (repl.slaveseldb), a SELECT command is emitted first, both in the
 * backlog and to the slaves. Slaves in SLAVE_STATE_WAIT_BGSAVE_START state
 * are skipped.
 *
 * The function returns immediately when there is neither a backlog nor a
 * slave. Having slaves without a backlog is not allowed (asserted). */
void replicationFeedSlaves(dlist *slaves, int dictid, robj **argv, int argc) {
    dlistNode *ln;
    dlistIter li;
    int j, len;
    char llstr[LONG_STR_SIZE];

    /* If there aren't slaves, and there is no backlog buffer to populate,
     * we can return ASAP. */
    if (repl.repl_backlog == NULL && dlistLength(slaves) == 0) return;

    /* We can't have slaves attached and no backlog. */
    ASSERT(!(dlistLength(slaves) != 0 && repl.repl_backlog == NULL));

    /* Send SELECT command to every slave if needed. */
    if (repl.slaveseldb != dictid) {
        robj *selectcmd;

        /* For a few DBs we have pre-computed SELECT command. */
        if (dictid >= 0 && dictid < PROTO_SHARED_SELECT_CMDS) {
            selectcmd = shared.select[dictid];
        } else {
            int dictid_len;

            dictid_len = ll2string(llstr,sizeof(llstr),dictid);
            selectcmd = createObject(OBJ_STRING,
                sdscatprintf(sdsempty(),
                "*2\r\n$6\r\nSELECT\r\n$%d\r\n%s\r\n",
                dictid_len, llstr));
        }

        /* Add the SELECT command into the backlog. */
        if (repl.repl_backlog) feedReplicationBacklogWithObject(selectcmd);

        /* Send it to slaves. */
        dlistRewind(slaves,&li);
        while((ln = dlistNext(&li))) {
            client *slave = ln->value;
            if (slave->replstate == SLAVE_STATE_WAIT_BGSAVE_START) continue;
            addReply(slave,selectcmd);
        }

        /* Only the object created above is ours to release; the shared
         * pre-computed commands must stay alive. */
        if (dictid < 0 || dictid >= PROTO_SHARED_SELECT_CMDS)
            decrRefCount(selectcmd);
    }
    repl.slaveseldb = dictid;

    /* Write the command to the replication backlog if any. */
    if (repl.repl_backlog) {
        char aux[LONG_STR_SIZE+3];

        /* Add the multi bulk reply length. */
        aux[0] = '*';
        len = ll2string(aux+1,sizeof(aux)-1,argc);
        aux[len+1] = '\r';
        aux[len+2] = '\n';
        feedReplicationBacklog(aux,len+3);

        for (j = 0; j < argc; j++) {
            long objlen = stringObjectLen(argv[j]);

            /* We need to feed the buffer with the object as a bulk reply
             * not just as a plain string, so create the $..CRLF payload len
             * and add the final CRLF */
            aux[0] = '$';
            len = ll2string(aux+1,sizeof(aux)-1,objlen);
            aux[len+1] = '\r';
            aux[len+2] = '\n';
            feedReplicationBacklog(aux,len+3);
            feedReplicationBacklogWithObject(argv[j]);
            /* The CRLF stored at the end of the header is reused as the
             * trailing CRLF of the payload. */
            feedReplicationBacklog(aux+len+1,2);
        }
    }

    /* Write the command to every slave. Iterate the list received as
     * argument, the same one used above for the SELECT command, so that
     * SELECT and the command itself always reach the same set of slaves. */
    dlistRewind(slaves,&li);
    while((ln = dlistNext(&li))) {
        client *slave = ln->value;

        /* Don't feed slaves that are still waiting for BGSAVE to start */
        if (slave->replstate == SLAVE_STATE_WAIT_BGSAVE_START) continue;

        /* Feed slaves that are waiting for the initial SYNC (so these commands
         * are queued in the output buffer until the initial SYNC completes),
         * or are already in sync with the master. */

        /* Add the multi bulk length. */
        addReplyMultiBulkLen(slave,argc);

        /* Then every argument as a bulk reply. */
        for (j = 0; j < argc; j++)
            addReplyBulk(slave,argv[j]);
    }
}


================================================
FILE: src/vr_replication.h
================================================
#ifndef _VR_REPLICATION_H_
#define _VR_REPLICATION_H_

/* Slave replication state. Stored in the repl_state field of
 * struct vr_replication, for slaves to remember what to do next. */
#define REPL_STATE_NONE 0 /* No active replication */
#define REPL_STATE_CONNECT 1 /* Must connect to master */
#define REPL_STATE_CONNECTING 2 /* Connecting to master */
/* --- Handshake states, must be ordered --- */
#define REPL_STATE_RECEIVE_PONG 3 /* Wait for PING reply */
#define REPL_STATE_SEND_AUTH 4 /* Send AUTH to master */
#define REPL_STATE_RECEIVE_AUTH 5 /* Wait for AUTH reply */
#define REPL_STATE_SEND_PORT 6 /* Send REPLCONF listening-port */
#define REPL_STATE_RECEIVE_PORT 7 /* Wait for REPLCONF reply */
#define REPL_STATE_SEND_CAPA 8 /* Send REPLCONF capa */
#define REPL_STATE_RECEIVE_CAPA 9 /* Wait for REPLCONF reply */
#define REPL_STATE_SEND_PSYNC 10 /* Send PSYNC */
#define REPL_STATE_RECEIVE_PSYNC 11 /* Wait for PSYNC reply */
/* --- End of handshake states --- */
#define REPL_STATE_TRANSFER 12 /* Receiving .rdb from master */
#define REPL_STATE_CONNECTED 13 /* Connected to master */

/* State of slaves from the POV of the master. Used in client->replstate.
 * In SEND_BULK and ONLINE state the slave receives new updates
 * in its output queue. In the WAIT_BGSAVE states instead the server is waiting
 * to start the next background saving in order to send updates to it. */
#define SLAVE_STATE_WAIT_BGSAVE_START 6 /* We need to produce a new RDB file. */
#define SLAVE_STATE_WAIT_BGSAVE_END 7 /* Waiting RDB file creation to finish. */
#define SLAVE_STATE_SEND_BULK 8 /* Sending RDB file to slave. */
#define SLAVE_STATE_ONLINE 9 /* RDB file transmitted, sending just updates. */

/* Slave capabilities. Bit flags stored in client->slave_capa. */
#define SLAVE_CAPA_NONE 0
#define SLAVE_CAPA_EOF (1<<0)   /* Can parse the RDB EOF streaming format. */

/* Synchronous read timeout - slave side */
#define CONFIG_REPL_SYNCIO_TIMEOUT 5

/* Values for the role field of struct vr_replication. */
#define REPLICATION_ROLE_MASTER 0
#define REPLICATION_ROLE_SLAVE  1

/* Replication backlog settings. The two defaults are the values that
 * vr_replication_init() assigns to repl_backlog_size and
 * repl_backlog_time_limit. */
#define CONFIG_DEFAULT_REPL_BACKLOG_SIZE (1024*1024)    /* 1mb */
#define CONFIG_DEFAULT_REPL_BACKLOG_TIME_LIMIT (60*60)  /* 1 hour */
#define CONFIG_REPL_BACKLOG_MIN_SIZE (1024*16)          /* 16k */

/* Replication state of the instance, both for the master side (slaves list,
 * backlog, min-slaves accounting) and for the slave side (link with the
 * master, transfer state). A single global instance named 'repl' is
 * declared below and defined in vr_replication.c. */
struct vr_replication {
    vr_eventloop vel;       /* Event loop owned by the replication module;
                               vel.unixtime is its cached Unix time. */

    int role;               /* Master/slave? See REPLICATION_ROLE_*. */

    /* Replication (master) */
    dlist *slaves;           /* List of slaves */
    int slaveseldb;                 /* Last SELECTed DB in replication output */
    long long master_repl_offset;   /* Global replication offset */
    int repl_ping_slave_period;     /* Master pings the slave every N seconds */
    char *repl_backlog;             /* Replication backlog for partial syncs */
    long long repl_backlog_size;    /* Backlog circular buffer size */
    long long repl_backlog_histlen; /* Backlog actual data length */
    long long repl_backlog_idx;     /* Backlog circular buffer current offset */
    long long repl_backlog_off;     /* Replication offset of first byte in the
                                       backlog buffer. */
    time_t repl_backlog_time_limit; /* Time without slaves after the backlog
                                       gets released. */
    time_t repl_no_slaves_since;    /* We have no slaves since that time.
                                       Only valid if the slaves list is
                                       empty. */
    int repl_min_slaves_to_write;   /* Min number of slaves to write. */
    int repl_min_slaves_max_lag;    /* Max lag of <count> slaves to write. */
    int repl_good_slaves_count;     /* Number of slaves with lag <= max_lag. */
    int repl_diskless_sync;         /* Send RDB to slaves sockets directly. */
    int repl_diskless_sync_delay;   /* Delay to start a diskless repl BGSAVE. */

    /* Replication (slave) */
    char *masterauth;               /* AUTH with this password with master */
    char *masterhost;               /* Hostname of master */
    int masterport;                 /* Port of master */
    int repl_timeout;               /* Timeout after N seconds of master idle */
    client *master;     /* Client that is master for this slave */
    client *cached_master; /* Cached master to be reused for PSYNC. */
    int repl_syncio_timeout; /* Timeout for synchronous I/O calls */
    int repl_state;          /* Replication status if the instance is a slave,
                                one of the REPL_STATE_* values. */
    off_t repl_transfer_size; /* Size of RDB to read from master during sync. */
    off_t repl_transfer_read; /* Amount of RDB read from master during sync. */
    off_t repl_transfer_last_fsync_off; /* Offset when we fsync-ed last time. */
    int repl_transfer_s;     /* Slave -> Master SYNC socket */
    int repl_transfer_fd;    /* Slave -> Master SYNC temp file descriptor */
    char *repl_transfer_tmpfile; /* Slave-> master SYNC temp file name */
    time_t repl_transfer_lastio; /* Unix time of the latest read, for timeout */
    int repl_serve_stale_data; /* Serve stale data when link is down? */
    int repl_slave_ro;          /* Slave is read only? */
    time_t repl_down_since; /* Unix time at which link with master went down */
    int repl_disable_tcp_nodelay;   /* Disable TCP_NODELAY after SYNC? */
    int slave_priority;             /* Reported in INFO and used by Sentinel. */
    char repl_master_runid[CONFIG_RUN_ID_SIZE+1];  /* Master run id for PSYNC. */
    long long repl_master_initial_offset;         /* Master PSYNC offset. */
};

extern struct vr_replication repl;

int vr_replication_init(void);
void vr_replication_deinit(void);

void unblockClientWaitingReplicas(client *c);
void refreshGoodSlavesCount(void);
void replicationHandleMasterDisconnection(void);
void replicationCacheMaster(client *c);
char *replicationGetSlaveName(client *c);
void replconfCommand(client *c);
void putSlaveOnline(client *slave);
void replicationSendAck(void);
void replicationFeedMonitors(client *c, dlist *monitors, int dictid, robj **argv, int argc);
void replicationFeedSlaves(dlist *slaves, int dictid, robj **argv, int argc);
void feedReplicationBacklogWithObject(robj *o);
void feedReplicationBacklog(void *ptr, size_t len);

#endif


================================================
FILE: src/vr_scripting.c
================================================
#include <vr_core.h>

/* SCRIPT command handler. Placeholder implementation: the arguments are not
 * inspected and the reply is always +OK. */
void scriptCommand(client *c)
{
    addReply(c, shared.ok);
}


================================================
FILE: src/vr_scripting.h
================================================
#ifndef _VR_SCRIPTING_H_
#define _VR_SCRIPTING_H_

void scriptCommand(client *c);

#endif


================================================
FILE: src/vr_server.c
================================================
#include <sys/utsname.h>

#include <vr_core.h>

/* Global vars */
struct vr_server server; /* server global state */

/* Our shared "common" objects */
struct sharedObjectsStruct shared;

/* Hash function for keys that are NUL-terminated C strings. */
unsigned int
dictStrHash(const void *key) {
    size_t keylen = strlen((char*)key);

    return dictGenHashFunction((unsigned char*)key, keylen);
}

/* Hash function for NUL-terminated C string keys, computed with
 * dictGenCaseHashFunction(). */
unsigned int
dictStrCaseHash(const void *key) {
    size_t keylen = strlen((char*)key);

    return dictGenCaseHashFunction((unsigned char*)key, keylen);
}

/* Hash function for keys that are sds strings: the whole sds length is
 * hashed. */
unsigned int
dictSdsHash(const void *key) {
    size_t keylen = sdslen((char*)key);

    return dictGenHashFunction((unsigned char*)key, keylen);
}

/* Hash function for sds string keys, computed with
 * dictGenCaseHashFunction() over the whole sds length. */
unsigned int
dictSdsCaseHash(const void *key) {
    size_t keylen = sdslen((char*)key);

    return dictGenCaseHashFunction((unsigned char*)key, keylen);
}

/* Key comparison for NUL-terminated C string keys (case sensitive).
 *
 * privdata: unused.
 * key1, key2: the C strings to compare.
 *
 * Returns 1 when the two strings have the same length and content, 0
 * otherwise.
 *
 * Lengths are kept as size_t, the type returned by strlen() and expected
 * by memcmp(), so that they are never truncated or turned negative. */
int
dictStrKeyCompare(void *privdata, const void *key1,
        const void *key2)
{
    size_t l1,l2;
    (void)privdata;

    l1 = strlen((const char*)key1);
    l2 = strlen((const char*)key2);
    if (l1 != l2) return 0;
    return memcmp(key1, key2, l1) == 0;
}

/* Case insensitive key comparison for C string keys, used for the config
 * option lookup table and wherever a case insensitive, non binary-safe
 * comparison is needed. Returns 1 when the keys match, 0 otherwise. */
int
dictStrKeyCaseCompare(void *privdata, const void *key1,
        const void *key2)
{
    int diff;
    DICT_NOTUSED(privdata);

    diff = strcasecmp(key1, key2);
    return diff == 0;
}

/* Binary-safe key comparison for sds string keys.
 *
 * privdata: unused.
 * key1, key2: the sds strings to compare.
 *
 * Returns 1 when the two strings have the same length and content, 0
 * otherwise.
 *
 * Lengths are kept as size_t, the type expected by memcmp(), so that they
 * are never truncated or turned negative. */
int
dictSdsKeyCompare(void *privdata, const void *key1,
        const void *key2)
{
    size_t l1,l2;
    DICT_NOTUSED(privdata);

    l1 = sdslen((sds)key1);
    l2 = sdslen((sds)key2);
    if (l1 != l2) return 0;
    return memcmp(key1, key2, l1) == 0;
}

/* Case insensitive key comparison, used for the command lookup table and
 * wherever a case insensitive, non binary-safe comparison is needed: the
 * keys are compared with strcasecmp(), hence only up to their first NUL
 * byte. Returns 1 when the keys match, 0 otherwise. */
int
dictSdsKeyCaseCompare(void *privdata, const void *key1,
        const void *key2)
{
    int diff;
    DICT_NOTUSED(privdata);

    diff = strcasecmp(key1, key2);
    return diff == 0;
}

void *
dictSdsKeyDupFromStr(void *privdata, const void *key)
{
    DICT_NOTUSED(privdata);

    return sdsnew(key); /* key is c string */
}

void
dictSdsDestructor(void *privdata, void *val)
{
    DICT_NOTUSED(privdata);

    sdsfree(val);
}

/* Destructor callback for objects: releases 'val' with freeObject().
 * A NULL value is accepted and ignored (values of swapped out keys are set
 * to NULL). */
void
dictObjectDestructor(void *privdata, void *val)
{
    DICT_NOTUSED(privdata);

    if (val != NULL) {
        freeObject(val);
    }
}

int
dictEncObjKeyCompare(void *privdata, const void *key1,
        const void *key2)
{
    robj *o1 = (robj*) key1, *o2 = (robj*) key2;
    robj *o1_new, *o2_new;
    int cmp;

    if (o1->encoding == OBJ_ENCODING_INT &&
        o2->encoding == OBJ_ENCODING_INT)
            return o1->ptr == o2->ptr;

    o1_new = getDecodedObject(o1);
    o2_new = getDecodedObject(o2);
    cmp = dictSdsKeyCompare(privdata,o1_new->ptr,o2_new->ptr);
    if (o1_new != o1)  freeObject(o1_new);
    if (o2_new != o2)  freeObject(o2_new);
    return cmp;
}

unsigned int
dictEncObjHash(const void *key) {
    robj *o = (robj*) key;

    if (sdsEncodedObject(o)) {
        return dictGenHashFunction(o->ptr, sdslen((sds)o->ptr));
    } else {
        if (o->encoding == OBJ_ENCODING_INT) {
            char buf[32];
            int len;

            len = ll2string(buf,32,(long)o->ptr);
            return dictGenHashFunction((unsigned char*)buf, len);
        } else {
            unsigned int hash;
            robj *o_new;

            o_new = getDecodedObject(o);
            hash = dictGenHashFunction(o_new->ptr, sdslen((sds)o_new->ptr));
            if (o_new!= o) freeObject(o_new);
            return hash;
        }
    }
}

/* Hash function for object keys: o->ptr is hashed as an sds string, over
 * its whole sds length. */
unsigned int
dictObjHash(const void *key) {
    const robj *o = key;
    size_t keylen = sdslen((sds)o->ptr);

    return dictGenHashFunction(o->ptr, keylen);
}

/* Key comparison for object keys: the ptr fields of the two objects are
 * compared with dictSdsKeyCompare(). Returns 1 when they match, 0
 * otherwise. */
int
dictObjKeyCompare(void *privdata, const void *key1,
        const void *key2)
{
    const robj *left = key1;
    const robj *right = key2;
    int equal;

    equal = dictSdsKeyCompare(privdata,left->ptr,right->ptr);
    return equal;
}

void
dictListDestructor(void *privdata, void *val)
{
    DICT_NOTUSED(privdata);
    dlistRelease((dlist*)val);
}

/* Hash type hash table (note that small hashes are represented with ziplists).
 * Keys and values are both objects: they are not duplicated on insertion
 * and both are released with dictObjectDestructor(). */
dictType hashDictType = {
    dictEncObjHash,             /* hash function */
    NULL,                       /* key dup */
    NULL,                       /* val dup */
    dictEncObjKeyCompare,       /* key compare */
    dictObjectDestructor,  /* key destructor */
    dictObjectDestructor   /* val destructor */
};

/* Sets type hash table. Keys are objects released with
 * dictObjectDestructor(); no value destructor is installed. */
dictType setDictType = {
    dictEncObjHash,            /* hash function */
    NULL,                      /* key dup */
    NULL,                      /* val dup */
    dictEncObjKeyCompare,      /* key compare */
    dictObjectDestructor, /* key destructor */
    NULL                       /* val destructor */
};

/* Sorted sets hash (note: a skiplist is used in addition to the hash table).
 * Keys are objects released with dictObjectDestructor(); no value
 * destructor is installed. */
dictType zsetDictType = {
    dictEncObjHash,            /* hash function */
    NULL,                      /* key dup */
    NULL,                      /* val dup */
    dictEncObjKeyCompare,      /* key compare */
    dictObjectDestructor,      /* key destructor */
    NULL                       /* val destructor */
};

/* =========================== Server initialization ======================== */

static void createSharedObjects(void) {
    int j;
    robj **obj;

    shared.crlf = createObject(OBJ_STRING,sdsnew("\r\n"));
    shared.ok = createObject(OBJ_STRING,sdsnew("+OK\r\n"));
    shared.err = createObject(OBJ_STRING,sdsnew("-ERR\r\n"));
    shared.emptybulk = createObject(OBJ_STRING,sdsnew("$0\r\n\r\n"));
    shared.czero = createObject(OBJ_STRING,sdsnew(":0\r\n"));
    shared.cone = createObject(OBJ_STRING,sdsnew(":1\r\n"));
    shared.cnegone = createObject(OBJ_STRING,sdsnew(":-1\r\n"));
    shared.nullbulk = createObject(OBJ_STRING,sdsnew("$-1\r\n"));
    shared.nullmultibulk = createObject(OBJ_STRING,sdsnew("*-1\r\n"));
    shared.emptymultibulk = createObject(OBJ_STRING,sdsnew("*0\r\n"));
    shared.pong = createObject(OBJ_STRING,sdsnew("+PONG\r\n"));
    shared.queued = createObject(OBJ_STRING,sdsnew("+QUEUED\r\n"));
    shared.emptyscan = createObject(OBJ_STRING,sdsnew("*2\r\n$1\r\n0\r\n*0\r\n"));
    shared.wrongtypeerr = createObject(OBJ_STRING,sdsnew(
        "-WRONGTYPE Operation against a key holding the wrong kind of value\r\n"));
    shared.nokeyerr = createObject(OBJ_STRING,sdsnew(
        "-ERR no such key\r\n"));
    shared.syntaxerr = createObject(OBJ_STRING,sdsnew(
        "-ERR syntax error\r\n"));
    shared.sameobjecterr = createObject(OBJ_STRING,sdsnew(
        "-ERR source and destination objects are the same\r\n"));
    shared.outofrangeerr = createObject(OBJ_STRING,sdsnew(
        "-ERR index out of range\r\n"));
    shared.noscripterr = createObject(OBJ_STRING,sdsnew(
        "-NOSCRIPT No matching script. Please use EVAL.\r\n"));
    shared.loadingerr = createObject(OBJ_STRING,sdsnew(
        "-LOADING Redis is loading the dataset in memory\r\n"));
    shared.slowscripterr = createObject(OBJ_STRING,sdsnew(
        "-BUSY Redis is busy running a script. You can only call SCRIPT KILL or SHUTDOWN NOSAVE.\r\n"));
    shared.masterdownerr = createObject(OBJ_STRING,sdsnew(
        "-MASTERDOWN Link with MASTER is down and slave-serve-stale-data is set to 'no'.\r\n"));
    shared.bgsaveerr = createObject(OBJ_STRING,sdsnew(
        "-MISCONF Redis is configured to save RDB snapshots, but is currently not able to persist on disk. Commands that may modify the data set are disabled. Please check Redis logs for details about the error.\r\n"));
    shared.roslaveerr = createObject(OBJ_STRING,sdsnew(
        "-READONLY You can't write against a read only slave.\r\n"));
    shared.noautherr = createObject(OBJ_STRING,sdsnew(
        "-NOAUTH Authentication required.\r\n"));
    shared.noadminerr = createObject(OBJ_STRING,sdsnew(
        "-NOADMIN Authentication required.\r\n"));
    shared.oomerr = createObject(OBJ_STRING,sdsnew(
        "-OOM command not allowed when used memory > 'maxmemory'.\r\n"));
    shared.execaborterr = createObject(OBJ_STRING,sdsnew(
        "-EXECABORT Transaction discarded because of previous errors.\r\n"));
    shared.noreplicaserr = createObject(OBJ_STRING,sdsnew(
        "-NOREPLICAS Not enough good slaves to write.\r\n"));
    shared.busykeyerr = createObject(OBJ_STRING,sdsnew(
        "-BUSYKEY Target key name already exists.\r\n"));
    shared.space = createObject(OBJ_STRING,sdsnew(" "));
    shared.colon = createObject(OBJ_STRING,sdsnew(":"));
    shared.plus = createObject(OBJ_STRING,sdsnew("+"));

    for (j = 0; j < PROTO_SHARED_SELECT_CMDS; j++) {
        char dictid_str[64];
        int dictid_len;

        dictid_len = ll2string(dictid_str,sizeof(dictid_str),j);
        shared.select[j] = createObject(OBJ_STRING,
            sdscatprintf(sdsempty(),
                "*2\r\n$6\r\nSELECT\r\n$%d\r\n%s\r\n",
                dictid_len, dictid_str));
    }
    shared.messagebulk = createStringObject("$7\r\nmessage\r\n",13);
    shared.pmessagebulk = createStringObject("$8\r\npmessage\r\n",14);
    shared.subscribebulk = createStringObject("$9\r\nsubscribe\r\n",15);
    shared.unsubscribebulk = createStringObject("$11\r\nunsubscribe\r\n",18);
    shared.psubscribebulk = createStringObject("$10\r\npsubscribe\r\n",17);
    shared.punsubscribebulk = createStringObject("$12\r\npunsubscribe\r\n",19);
    shared.del = createStringObject("DEL",3);
    shared.rpop = createStringObject("RPOP",4);
    shared.lpop = createStringObject("LPOP",4);
    shared.lpush = createStringObject("LPUSH",5);
    for (j = 0; j < OBJ_SHARED_INTEGERS; j++) {
        shared.integers[j] = createObject(OBJ_STRING,(void*)(long)j);
        shared.integers[j]->encoding = OBJ_ENCODING_INT;
    }
    for (j = 0; j < OBJ_SHARED_BULKHDR_LEN; j++) {
        shared.mbulkhdr[j] = createObject(OBJ_STRING,
            sdscatprintf(sdsempty(),"*%d\r\n",j));
        shared.bulkhdr[j] = createObject(OBJ_STRING,
            sdscatprintf(sdsempty(),"$%d\r\n",j));
    }
    /* The following two shared objects, minstring and maxstrings, are not
     * actually used for their value but as a special object meaning
     * respectively the minimum possible string and the maximum possible
     * string in string comparisons for the ZRANGEBYLEX command. */
    shared.minstring = createStringObject("minstring",9);
    shared.maxstring = createStringObject("maxstring",9);

    shared.outofcomplexitylimit = createObject(OBJ_STRING,sdsnew(
        "-ERR Out of max time complexity limit.\r\n"));

    /* Set this objects to constant */
    for (obj = &shared; *obj != NULL; obj ++) {
        (*obj)->constant = 1;
    }
}

/* Initialize the global server state and start the worker, master and
 * backend threads.
 *
 * nci supplies the configuration file name, the pid file name and the
 * number of worker threads.
 *
 * Returns VR_OK on success. Returns VR_ERROR (after logging the reason)
 * if the configuration cannot be created, if the admin-only command list
 * cannot be populated, or if any of the thread groups fails to start. */
int
init_server(struct instance *nci)
{
    int ret;
    uint32_t i;
    redisDb *db;
    
    server.pid = getpid();
    server.arch_bits = (sizeof(long) == 8) ? 64 : 32;
    server.starttime = time(NULL);
    get_random_hex_chars(server.runid, CONFIG_RUN_ID_SIZE);

    /* Build the command table and cache the commands looked up often. */
    server.commands = dictCreate(&commandTableDictType,NULL);
    populateCommandTable();
    server.delCommand = lookupCommandByCString("del");
    server.multiCommand = lookupCommandByCString("multi");
    server.lpushCommand = lookupCommandByCString("lpush");
    server.lpopCommand = lookupCommandByCString("lpop");
    server.rpopCommand = lookupCommandByCString("rpop");
    server.sremCommand = lookupCommandByCString("srem");
    server.execCommand = lookupCommandByCString("exec");

    /* The configuration is dereferenced right below (cserver->...) and
     * handed to master_init(), so a failed creation must stop here. */
    conf = conf_create(nci->conf_filename);
    if (conf == NULL) {
        log_error("Create conf failed");
        return VR_ERROR;
    }

    ret = populateCommandsNeedAdminpass();
    if (ret != VR_OK) {
        log_error("Populate need adminpass commands failed");
        return VR_ERROR;
    }

    server.configfile = getAbsolutePath(nci->conf_filename);
    server.hz = 10;
    /* Total db count = logical databases * internal dbs per database. */
    server.dblnum = cserver->databases;
    server.dbinum = cserver->internal_dbs_per_databases;
    server.dbnum = server.dblnum*server.dbinum;
    darray_init(&server.dbs, server.dbnum, sizeof(redisDb));
    server.pidfile = nci->pid_filename;
    server.executable = NULL;
    server.activerehashing = CONFIG_DEFAULT_ACTIVE_REHASHING;
    
    server.client_max_querybuf_len = PROTO_MAX_QUERYBUF_LEN;

    for (i = 0; i < server.dbnum; i ++) {
        db = darray_push(&server.dbs);
        redisDbInit(db);
    }

    server.clients = dlistCreate();
    
    server.monitors = dlistCreate();

    server.loading = 0;

    server.lua_timedout = 0;

    server.aof_state = AOF_OFF;

    server.stop_writes_on_bgsave_err = 0;

    server.ready_keys = dlistCreate();

    server.system_memory_size = dalloc_get_memory_size();

    server.rdb_child_pid = -1;
    server.aof_child_pid = -1;

    server.hash_max_ziplist_entries = OBJ_HASH_MAX_ZIPLIST_ENTRIES;
    server.hash_max_ziplist_value = OBJ_HASH_MAX_ZIPLIST_VALUE;
    server.list_max_ziplist_size = OBJ_LIST_MAX_ZIPLIST_SIZE;
    server.list_compress_depth = OBJ_LIST_COMPRESS_DEPTH;
    server.set_max_intset_entries = OBJ_SET_MAX_INTSET_ENTRIES;
    server.zset_max_ziplist_entries = OBJ_ZSET_MAX_ZIPLIST_ENTRIES;
    server.zset_max_ziplist_value = OBJ_ZSET_MAX_ZIPLIST_VALUE;
    server.hll_sparse_max_bytes = CONFIG_DEFAULT_HLL_SPARSE_MAX_BYTES;

    server.notify_keyspace_events = 0;

    slowlogInit();
    vr_replication_init();
    
    createSharedObjects();

    server.port = cserver->port;
    
    /* Init worker first */
    ret = workers_init(nci->thread_num);
    if (ret != VR_OK) {
        log_error("Init worker threads failed");
        return VR_ERROR;
    }

    /* Init master after worker init */
    ret = master_init(conf);
    if (ret != VR_OK) {
        log_error("Init master thread failed");
        return VR_ERROR;
    }

    ret = backends_init(1);
    if (ret != VR_OK) {
        log_error("Init backend threads failed");
        return VR_ERROR;
    }

    log_debug(LOG_NOTICE, "memory alloc lock type: %s", malloc_lock_type());
    log_debug(LOG_NOTICE, "malloc lib: %s", DMALLOC_LIB);

    log_debug(LOG_NOTICE, "stats lock type: %s", STATS_LOCK_TYPE);

    return VR_OK;
}

/* Return the current LRU clock: the millisecond time from vr_msec_now()
 * divided by LRU_CLOCK_RESOLUTION and masked with LRU_CLOCK_MAX. */
unsigned int getLRUClock(void) {
    unsigned int lru_clock;

    lru_clock = (vr_msec_now()/LRU_CLOCK_RESOLUTION) & LRU_CLOCK_MAX;
    return lru_clock;
}

/* Helper for freeMemoryIfNeeded(): sample up to 'maxmemory_samples'
 * entries from 'sampledict' and merge them into the eviction 'pool'.
 *
 * The pool is kept sorted by ascending idle time: entries with the
 * smaller idle time are on the left, entries with the higher idle time
 * on the right, and free slots (key == NULL) are at the end. A sample is
 * always inserted while there are free slots. When the pool is full a
 * sample is inserted only if it does not land at position 0, and the
 * leftmost entry (smallest idle time) is discarded to make room.
 *
 * 'keydict' is the dictionary holding the value objects; when it differs
 * from 'sampledict' every sampled key is looked up again in 'keydict'
 * to reach the object used to estimate the idle time. */

#define EVICTION_SAMPLES_ARRAY_SIZE 16
void evictionPoolPopulate(dict *sampledict, dict *keydict, 
    struct evictionPoolEntry *pool, int maxmemory_samples) {
    dictEntry *stack_samples[EVICTION_SAMPLES_ARRAY_SIZE];
    dictEntry **samples;
    int nsampled, idx;

    /* Small sample counts use the on-stack array, bigger ones need a
     * temporary heap buffer that is released before returning. */
    samples = (maxmemory_samples <= EVICTION_SAMPLES_ARRAY_SIZE) ?
        stack_samples : dalloc(sizeof(samples[0])*maxmemory_samples);

    nsampled = dictGetSomeKeys(sampledict,samples,maxmemory_samples);
    for (idx = 0; idx < nsampled; idx++) {
        dictEntry *entry = samples[idx];
        sds key = dictGetKey(entry);
        unsigned long long idle;
        robj *val;
        int slot;
        int pool_full;

        /* Sampling from a dictionary other than the key dictionary:
         * fetch the entry holding the value object from 'keydict'. */
        if (sampledict != keydict) entry = dictFind(keydict, key);
        val = dictGetVal(entry);
        idle = estimateObjectIdleTime(val);

        /* Find the first free slot, or the first used slot whose idle
         * time is not smaller than ours. */
        pool_full = (pool[MAXMEMORY_EVICTION_POOL_SIZE-1].key != NULL);
        for (slot = 0; slot < MAXMEMORY_EVICTION_POOL_SIZE; slot++) {
            if (!pool[slot].key) break;
            if (!(pool[slot].idle < idle)) break;
        }

        /* Not better than the leftmost entry and no room left: skip. */
        if (slot == 0 && pool_full) continue;

        /* A free slot needs no preparation; otherwise make room. */
        if (slot >= MAXMEMORY_EVICTION_POOL_SIZE || pool[slot].key != NULL) {
            if (!pool_full) {
                /* Room on the right: shift [slot, end) one position to
                 * the right and insert at 'slot'. */
                memmove(pool+slot+1,pool+slot,
                    sizeof(pool[0])*(MAXMEMORY_EVICTION_POOL_SIZE-slot-1));
            } else {
                /* Pool full: drop the leftmost entry, shift the entries
                 * before the insertion point one position to the left
                 * and insert at slot-1. */
                slot--;
                sdsfree(pool[0].key);
                memmove(pool,pool+1,sizeof(pool[0])*slot);
            }
        }

        pool[slot].key = sdsdup(key);
        pool[slot].idle = idle;
    }

    if (samples != stack_samples) dfree(samples);
}

/* Evict keys until the memory reported by dalloc_used_memory() is not
 * above the configured maxmemory.
 *
 * Each pass visits every db in server.dbs, takes its write lock, picks
 * one key according to the configured maxmemory policy and deletes it.
 * Passes are repeated until memory is back under the limit. The number
 * of deleted keys is added to the 'evictedkeys' counter of vel->stats.
 *
 * Returns VR_OK when memory is within the limit (either on entry or
 * after evicting). Returns VR_ERROR when the policy is
 * MAXMEMORY_NO_EVICTION, or when a complete pass over all the dbs
 * could not free any key. */
int freeMemoryIfNeeded(vr_eventloop *vel) {
    int keys_freed = 0;
    long long maxmemory;
    int maxmemory_policy, maxmemory_samples;

    maxmemory = vel->cc.maxmemory;
    if (dalloc_used_memory() <= maxmemory)
        return VR_OK;

    conf_server_get(CONFIG_SOPN_MAXMEMORYP, &maxmemory_policy);
    if (maxmemory_policy == MAXMEMORY_NO_EVICTION)
        return VR_ERROR; /* We need to free memory, but policy forbids. */

    conf_server_get(CONFIG_SOPN_MAXMEMORYS, &maxmemory_samples);
    while (1) {
        int j, k;

        for (j = 0; j < server.dbnum; j++) {
            long bestval = 0; /* just to prevent warning */
            sds bestkey = NULL;
            dictEntry *de;
            redisDb *db = darray_get(&server.dbs, j);
            dict *dict;

            lockDbWrite(db);
            /* allkeys-* policies sample the whole keyspace, the other
             * policies only the keys having an expire set. */
            if (maxmemory_policy == MAXMEMORY_ALLKEYS_LRU ||
                maxmemory_policy == MAXMEMORY_ALLKEYS_RANDOM)
            {
                dict = db->dict;
            } else {
                dict = db->expires;
            }
            if (dictSize(dict) == 0) {
                unlockDb(db);
                continue;
            }

            /* volatile-random and allkeys-random policy */
            if (maxmemory_policy == MAXMEMORY_ALLKEYS_RANDOM ||
                maxmemory_policy == MAXMEMORY_VOLATILE_RANDOM)
            {
                de = dictGetRandomKey(dict);
                bestkey = dictGetKey(de);
            }

            /* volatile-lru and allkeys-lru policy */
            else if (maxmemory_policy == MAXMEMORY_ALLKEYS_LRU ||
                maxmemory_policy == MAXMEMORY_VOLATILE_LRU)
            {
                struct evictionPoolEntry *pool = db->eviction_pool;

                while(bestkey == NULL) {
                    evictionPoolPopulate(dict, db->dict, db->eviction_pool, maxmemory_samples);
                    /* Go backward from best to worst element to evict. */
                    for (k = MAXMEMORY_EVICTION_POOL_SIZE-1; k >= 0; k--) {
                        if (pool[k].key == NULL) continue;
                        de = dictFind(dict,pool[k].key);

                        /* Remove the entry from the pool. */
                        sdsfree(pool[k].key);
                        /* Shift all elements on its right to left. */
                        memmove(pool+k,pool+k+1,
                            sizeof(pool[0])*(MAXMEMORY_EVICTION_POOL_SIZE-k-1));
                        /* Clear the element on the right which is empty
                         * since we shifted one position to the left.  */
                        pool[MAXMEMORY_EVICTION_POOL_SIZE-1].key = NULL;
                        pool[MAXMEMORY_EVICTION_POOL_SIZE-1].idle = 0;

                        /* If the key exists, is our pick. Otherwise it is
                         * a ghost and we need to try the next element. */
                        if (de) {
                            bestkey = dictGetKey(de);
                            break;
                        } else {
                            /* Ghost... */
                            continue;
                        }
                    }
                }
            }

            /* volatile-ttl */
            else if (maxmemory_policy == MAXMEMORY_VOLATILE_TTL) {
                for (k = 0; k < maxmemory_samples; k++) {
                    sds thiskey;
                    long thisval;

                    de = dictGetRandomKey(dict);
                    thiskey = dictGetKey(de);
                    thisval = (long) dictGetVal(de);

                    /* Expire sooner (minor expire unix timestamp) is better
                     * candidate for deletion */
                    if (bestkey == NULL || thisval < bestval) {
                        bestkey = thiskey;
                        bestval = thisval;
                    }
                }
            }

            /* Finally remove the selected key. The key is copied into a
             * temporary object because 'bestkey' points into the dict
             * entry that dbDelete() is about to remove. */
            if (bestkey) {
                robj *keyobj = createStringObject(bestkey,sdslen(bestkey));
                dbDelete(db,keyobj);
                freeObject(keyobj);
                keys_freed++;
            }
            
            unlockDb(db);

            /* Re-read the limit from the configuration and stop as soon
             * as we are back under it. */
            conf_server_get(CONFIG_SOPN_MAXMEMORY, &maxmemory);
            if (dalloc_used_memory() <= maxmemory) {
                goto stop;
            }
        }
        
        if (!keys_freed) {
            return VR_ERROR; /* nothing to free... */
        }

        /* Account for this pass and start counting the next one. */
        update_stats_add(vel->stats, evictedkeys, keys_freed);
        keys_freed = 0;
    }

stop:
    update_stats_add(vel->stats, evictedkeys, keys_freed);
    return VR_OK;
}

/* PING [message].
 *
 * Outside Pub/Sub mode the reply is +PONG, or the message as a bulk
 * reply when one is given. For a client flagged CLIENT_PUBSUB the reply
 * is a two element multi bulk: "pong" followed by the message (an empty
 * bulk when no message is given). */
void pingCommand(client *c) {
    int has_message;

    /* The command takes zero or one arguments. */
    if (c->argc > 2) {
        addReplyErrorFormat(c,"wrong number of arguments for '%s' command",
            c->cmd->name);
        return;
    }
    has_message = (c->argc != 1);

    if (!(c->flags & CLIENT_PUBSUB)) {
        if (has_message)
            addReplyBulk(c,c->argv[1]);
        else
            addReply(c,shared.pong);
        return;
    }

    addReply(c,shared.mbulkhdr[2]);
    addReplyBulkCBuffer(c,"pong",4);
    if (has_message)
        addReplyBulk(c,c->argv[1]);
    else
        addReplyBulkCBuffer(c,"",0);
}

/* Compare two C strings without short-circuiting on the first mismatch.
 *
 * Returns zero when the strings are equal and non-zero otherwise. Both
 * strings are copied into zero-padded buffers of CONFIG_AUTHPASS_MAX_LEN
 * bytes and every byte of the buffers is compared unconditionally, so the
 * time spent in the comparison loop does not depend on where the strings
 * differ. A string longer than the buffers is reported as different
 * without being compared. */
int time_independent_strcmp(char *a, char *b) {
    char padded_a[CONFIG_AUTHPASS_MAX_LEN];
    char padded_b[CONFIG_AUTHPASS_MAX_LEN];
    /* The cost of the two strlen() calls is len(a) + len(b); one of the
     * two strings is our own fixed password, so only the length of the
     * user supplied string influences it. */
    unsigned int len_a = strlen(a);
    unsigned int len_b = strlen(b);
    unsigned int pos = 0;
    int acc = 0;

    /* Strings that do not fit the buffers can't be compared. This is not
     * expected to happen in practice, so it leaks nothing useful. */
    if (len_a > sizeof(padded_a) || len_b > sizeof(padded_b)) return 1;

    /* Constant time zero fill, then copies proportional to the lengths. */
    memset(padded_a,0,sizeof(padded_a));
    memset(padded_b,0,sizeof(padded_b));
    memcpy(padded_a,a,len_a);
    memcpy(padded_b,b,len_b);

    /* Accumulate the differences of all the bytes, no early exit. */
    while (pos < sizeof(padded_a)) {
        acc |= (padded_a[pos] ^ padded_b[pos]);
        pos++;
    }

    /* The lengths must match as well. */
    acc |= len_a ^ len_b;
    return acc; /* Zero means the strings are the same. */
}

/* AUTH <password>.
 *
 * Replies with an error when no 'requirepass' is configured. On a match
 * an unauthenticated client becomes authenticated (level 1; an already
 * authenticated client keeps its current level) and +OK is sent. On a
 * mismatch the client is reset to unauthenticated and an error is sent. */
void authCommand(client *c) {
    sds requirepass;
    int mismatch;

    conf_server_get(CONFIG_SOPN_REQUIREPASS,&requirepass);
    if (requirepass == NULL) {
        addReplyError(c,"Client sent AUTH, but no password is set");
        return;
    }

    mismatch = time_independent_strcmp(c->argv[1]->ptr, requirepass);
    if (mismatch) {
        c->authenticated = 0;
        addReplyError(c,"invalid password");
    } else {
        if (!c->authenticated)
            c->authenticated = 1;
        addReply(c,shared.ok);
    }

    /* Release the password value obtained from the configuration. */
    sdsfree(requirepass);
}

/* ADMIN <password>.
 *
 * Replies with an error when no 'adminpass' is configured. On a match
 * the client authentication level is set to 2 and +OK is sent. On a
 * mismatch the client is reset to unauthenticated and an error is sent. */
void adminCommand(client *c) {
    sds adminpass;
    int mismatch;

    conf_server_get(CONFIG_SOPN_ADMINPASS,&adminpass);
    if (adminpass == NULL) {
        addReplyError(c,"Client sent ADMIN, but no password is set");
        return;
    }

    mismatch = time_independent_strcmp(c->argv[1]->ptr, adminpass);
    if (mismatch) {
        c->authenticated = 0;
        addReplyError(c,"invalid password");
    } else {
        c->authenticated = 2;
        addReply(c,shared.ok);
    }

    /* Release the password value obtained from the configuration. */
    sdsfree(adminpass);
}

/* Return 1 when the hash table is worth shrinking, 0 otherwise.
 *
 * The table qualifies when it is not empty, has more than
 * DICT_HT_INITIAL_SIZE slots, and its fill percentage (used*100/slots)
 * is below HASHTABLE_MIN_FILL. */
int htNeedsResize(dict *dict) {
    long long slots = dictSlots(dict);
    long long used = dictSize(dict);

    if (!slots || !used) return 0;
    if (!(slots > DICT_HT_INITIAL_SIZE)) return 0;
    return (used*100/slots < HASHTABLE_MIN_FILL);
}

/* Key counters of one logical database, accumulated over all of its
 * internal databases while the INFO output is generated. */
struct keys_statistics {
    long long keys_all;     /* sum of dictSize(db->dict) */
    long long vkeys_all;    /* sum of dictSize(db->expires) */
    long long avg_ttl_all;  /* sum of db->avg_ttl */
    int nexist;             /* internal dbs whose avg_ttl is > 0 */
};

/* Create the string returned by the INFO command. This is decoupled
 * from the INFO command itself as we need to report the same information
 * on memory corruption problems.
 *
 * 'vel' is the event loop of the caller: its stats and resident set size
 * are used by the memory section. 'section' selects what is reported
 * (compared case-insensitively):
 *   "server", "clients", "memory", "stats", "cpu", "internal", "keyspace"
 *             a single section;
 *   "default" (or NULL) every section except "internal";
 *   "all"     every section.
 *
 * Returns a new sds string; sections are separated by an empty line. */
sds genVireInfoString(vr_eventloop *vel, char *section) {
    sds info = sdsempty();
    time_t uptime = time(NULL)-server.starttime;
    int j, k;
    struct rusage self_ru;
    int allsections = 0, defsections = 0;
    int sections = 0;
    struct darray *kss = NULL;  /* type: keys_statistics */

    if (section == NULL) section = "default";
    allsections = strcasecmp(section,"all") == 0;
    defsections = strcasecmp(section,"default") == 0;

    getrusage(RUSAGE_SELF, &self_ru);

    /* Server */
    if (allsections || defsections || !strcasecmp(section,"server")) {
        static int call_uname = 1;
        static struct utsname name;
        char *mode;

        mode = "standalone";

        if (sections++) info = sdscat(info,"\r\n");

        if (call_uname) {
            /* Uname can be slow and is always the same output. Cache it. */
            uname(&name);
            call_uname = 0;
        }

        info = sdscatprintf(info,
            "# Server\r\n"
            "vire_version:%s\r\n"
            "vire_mode:%s\r\n"
            "os:%s %s %s\r\n"
            "arch_bits:%d\r\n"
            "multiplexing_api:%s\r\n"
            "gcc_version:%d.%d.%d\r\n"
            "process_id:%ld\r\n"
            "run_id:%s\r\n"
            "tcp_port:%d\r\n"
            "uptime_in_seconds:%jd\r\n"
            "uptime_in_days:%jd\r\n"
            "hz:%d\r\n"
            "executable:%s\r\n"
            "config_file:%s\r\n"
            "databases:%d\r\n"
            "internal_databases:%d\r\n",
            VR_VERSION_STRING,
            mode,
            name.sysname, name.release, name.machine,
            server.arch_bits,
            aeGetApiName(),
#ifdef __GNUC__
            __GNUC__,__GNUC_MINOR__,__GNUC_PATCHLEVEL__,
#else
            0,0,0,
#endif
            (long) getpid(),
            server.runid,
            server.port,
            (intmax_t)uptime,
            (intmax_t)(uptime/(3600*24)),
            server.hz,
            server.executable ? server.executable : "",
            server.configfile ? server.configfile : "",
            server.dblnum,
            server.dbinum);
    }

    /* Clients */
    if (allsections || defsections || !strcasecmp(section,"clients")) {
        if (sections++) info = sdscat(info,"\r\n");
        info = sdscatprintf(info,
            "# Clients\r\n"
            "connected_clients:%d\r\n",
            current_clients());
    }

    /* Memory */
    if (allsections || defsections || !strcasecmp(section,"memory")) {
        uint32_t idx;
        vr_worker *worker;
        char hmem[64];
        char peak_hmem[64];
        char total_system_hmem[64];
        char used_memory_rss_hmem[64];
        char maxmemory_hmem[64];
        size_t vr_used_memory = dalloc_used_memory();
        size_t total_system_mem = server.system_memory_size;
        const char *evict_policy;
        size_t peak_memory = 0, peak_memory_for_one_worker;
        long long maxmemory;
        int maxmemory_policy;

        /* Peak memory is updated from time to time by workerCron() so it
         * may happen that the instantaneous value is slightly bigger than
         * the peak value. This may confuse users, so we update the peak
         * if found smaller than the current memory usage. */
        for (idx = 0; idx < darray_n(&workers); idx ++) {
            worker = darray_get(&workers, idx);
            update_stats_get(worker->vel.stats, peak_memory, 
                &peak_memory_for_one_worker);
            if (peak_memory < peak_memory_for_one_worker)
                peak_memory = peak_memory_for_one_worker;
        }
        if (vr_used_memory > peak_memory) {
            peak_memory = vr_used_memory;
            update_stats_set(vel->stats, peak_memory, vr_used_memory);
        }

        conf_server_get(CONFIG_SOPN_MAXMEMORY,&maxmemory);
        conf_server_get(CONFIG_SOPN_MAXMEMORYP,&maxmemory_policy);
        evict_policy = get_evictpolicy_strings(maxmemory_policy);
    
        bytesToHuman(hmem,vr_used_memory);
        bytesToHuman(peak_hmem,peak_memory);
        bytesToHuman(total_system_hmem,total_system_mem);
        bytesToHuman(used_memory_rss_hmem,vel->resident_set_size);
        bytesToHuman(maxmemory_hmem,maxmemory);

        if (sections++) info = sdscat(info,"\r\n");
        info = sdscatprintf(info,
            "# Memory\r\n"
            "used_memory:%zu\r\n"
            "used_memory_human:%s\r\n"
            "used_memory_rss:%zu\r\n"
            "used_memory_rss_human:%s\r\n"
            "used_memory_peak:%zu\r\n"
            "used_memory_peak_human:%s\r\n"
            "total_system_memory:%lu\r\n"
            "total_system_memory_human:%s\r\n"
            "maxmemory:%lld\r\n"
            "maxmemory_human:%s\r\n"
            "maxmemory_policy:%s\r\n"
            "mem_fragmentation_ratio:%.2f\r\n"
            "mem_allocator:%s\r\n",
            vr_used_memory,
            hmem,
            vel->resident_set_size,
            used_memory_rss_hmem,
            peak_memory,
            peak_hmem,
            (unsigned long)total_system_mem,
            total_system_hmem,
            maxmemory,
            maxmemory_hmem,
            evict_policy,
            (float)vel->resident_set_size/vr_used_memory,
            DMALLOC_LIB
            );
    }

    /* Stats */
    if (allsections || defsections || !strcasecmp(section,"stats")) {
        uint32_t idx;
        vr_stats *stats;
        long long stat_numconnections=0, stat_numcommands=0;
        long long stat_net_input_bytes=0, stat_net_output_bytes=0;
        long long stat_rejected_conn=0;
        long long stat_expiredkeys=0;
        long long stat_evictedkeys=0;
        long long stat_keyspace_hits=0, stat_keyspace_misses=0;
        long long stat_numcommands_ops=0;
        float stat_net_input_bytes_ops=0, stat_net_output_bytes_ops=0;

        /* Sum the per-worker counters and instantaneous metrics. */
        for (idx = 0; idx < darray_n(&workers); idx ++) {
            long long stats_value;
            vr_worker *worker = darray_get(&workers, idx);
            stats = worker->vel.stats;

            update_stats_get(stats, numcommands, &stats_value);
            stat_numcommands += stats_value;
            update_stats_get(stats, numconnections, &stats_value);
            stat_numconnections += stats_value;
            update_stats_get(stats, expiredkeys, &stats_value);
            stat_expiredkeys += stats_value;
            update_stats_get(stats, evictedkeys, &stats_value);
            stat_evictedkeys += stats_value;
            update_stats_get(stats, net_input_bytes, &stats_value);
            stat_net_input_bytes += stats_value;
            update_stats_get(stats, net_output_bytes, &stats_value);
            stat_net_output_bytes += stats_value;
            update_stats_get(stats, keyspace_hits, &stats_value);
            stat_keyspace_hits += stats_value;
            update_stats_get(stats, keyspace_misses, &stats_value);
            stat_keyspace_misses += stats_value;
            
            stat_numcommands_ops += getInstantaneousMetric(stats, STATS_METRIC_COMMAND);
            stat_net_input_bytes_ops += (float)getInstantaneousMetric(stats, STATS_METRIC_NET_INPUT)/1024;
            stat_net_output_bytes_ops += (float)getInstantaneousMetric(stats, STATS_METRIC_NET_OUTPUT)/1024;
        }
        /* Backends only contribute to the expired keys counter. */
        for (idx = 0; idx < darray_n(&backends); idx ++) {
            long long stats_value;
            vr_backend *backend = darray_get(&backends, idx);
            stats = backend->vel.stats;

            update_stats_get(stats, expiredkeys, &stats_value);
            stat_expiredkeys += stats_value;
        }
        update_stats_get(master.vel.stats, rejected_conn, &stat_rejected_conn);
        
        if (sections++) info = sdscat(info,"\r\n");
        info = sdscatprintf(info,
            "# Stats\r\n"
            "total_connections_received:%lld\r\n"
            "total_commands_processed:%lld\r\n"
            "instantaneous_ops_per_sec:%lld\r\n"
            "total_net_input_bytes:%lld\r\n"
            "total_net_output_bytes:%lld\r\n"
            "instantaneous_input_kbps:%.2f\r\n"
            "instantaneous_output_kbps:%.2f\r\n"
            "rejected_connections:%lld\r\n"
            "expired_keys:%lld\r\n"
            "evicted_keys:%lld\r\n"
            "keyspace_hits:%lld\r\n"
            "keyspace_misses:%lld\r\n",
            stat_numconnections,
            stat_numcommands,
            stat_numcommands_ops,
            stat_net_input_bytes,
            stat_net_output_bytes,
            stat_net_input_bytes_ops,
            stat_net_output_bytes_ops,
            stat_rejected_conn,
            stat_expiredkeys,
            stat_evictedkeys,
            stat_keyspace_hits,
            stat_keyspace_misses);
    }

    /* CPU */
    if (allsections || defsections || !strcasecmp(section,"cpu")) {
        if (sections++) info = sdscat(info,"\r\n");
        info = sdscatprintf(info,
        "# CPU\r\n"
        "used_cpu_sys:%.2f\r\n"
        "used_cpu_user:%.2f\r\n",
        (float)self_ru.ru_stime.tv_sec+(float)self_ru.ru_stime.tv_usec/1000000,
        (float)self_ru.ru_utime.tv_sec+(float)self_ru.ru_utime.tv_usec/1000000);
    }
    
    /* Internal: one line per non-empty internal db. The per logical
     * database totals are kept in 'kss' so that the keyspace section
     * below does not need to lock and scan every db a second time. */
    if (allsections || !strcasecmp(section,"internal")) {
        redisDb *db;
        struct keys_statistics *ks;
        long long keys, vkeys, avg_ttl;
        
        kss = darray_create(server.dblnum, sizeof(struct keys_statistics));
        
        if (sections++) info = sdscat(info,"\r\n");
        info = sdscatprintf(info, "# Internal\r\n");
        for (j = 0; j < server.dblnum; j++) {
            ks = darray_push(kss);
            ks->keys_all = ks->vkeys_all = ks->avg_ttl_all = 0;
            ks->nexist = 0;
            for (k = 0; k < server.dbinum; k ++) {
                db = darray_get(&server.dbs, (uint32_t)(j*server.dbinum+k));
                lockDbRead(db);
                keys = dictSize(db->dict);
                vkeys = dictSize(db->expires);
                avg_ttl = db->avg_ttl;
                unlockDb(db);
                if (keys || vkeys) {
                    /* Report the value read under the lock: db->avg_ttl
                     * must not be accessed once the db is unlocked. */
                    info = sdscatprintf(info,
                        "db%d-%d:keys=%lld,expires=%lld,avg_ttl=%lld\r\n",
                        j, k, keys, vkeys, avg_ttl);
                }
                ks->keys_all += keys;
                ks->vkeys_all += vkeys;
                ks->avg_ttl_all += avg_ttl;
                if (avg_ttl > 0) ks->nexist ++;
            }
        }
    }

    /* Key space: one line per non-empty logical database. The reported
     * avg_ttl is the mean over the internal dbs having avg_ttl > 0. */
    if (allsections || defsections || !strcasecmp(section,"keyspace")) {
        redisDb *db;
        struct keys_statistics *ks;
        long long keys_all, vkeys_all, avg_ttl_all;
        int nexist;
        
        if (sections++) info = sdscat(info,"\r\n");
        info = sdscatprintf(info, "# Keyspace\r\n");
        if (kss == NULL) {
            /* No totals collected by the internal section: scan the dbs. */
            for (j = 0; j < server.dblnum; j++) {
                keys_all = vkeys_all = avg_ttl_all = 0;
                nexist = 0;
                for (k = 0; k < server.dbinum; k ++) {
                    db = darray_get(&server.dbs, (uint32_t)(j*server.dbinum+k));
                    lockDbRead(db);
                    keys_all += dictSize(db->dict);
                    vkeys_all += dictSize(db->expires);
                    avg_ttl_all += db->avg_ttl;
                    if (db->avg_ttl > 0) nexist ++;
                    unlockDb(db);
                }
                if (keys_all || vkeys_all) {
                    info = sdscatprintf(info,
                        "db%d:keys=%lld,expires=%lld,avg_ttl=%lld\r\n",
                        j, keys_all, vkeys_all, nexist>0?(avg_ttl_all/nexist):0);
                }
            }
        } else {
            for (j = 0; j < server.dblnum; j ++) {
                ks = darray_get(kss, j);
                if (ks->keys_all || ks->vkeys_all) {
                    info = sdscatprintf(info,
                        "db%d:keys=%lld,expires=%lld,avg_ttl=%lld\r\n",
                        j, ks->keys_all, ks->vkeys_all, 
                        ks->nexist>0?(ks->avg_ttl_all/ks->nexist):0);
                }
            }
        }
    }

    if (kss != NULL) {
        /* The element count is reset before destroying the array.
         * NOTE(review): presumably darray_destroy() expects an empty
         * array -- confirm against its implementation. */
        kss->nelem = 0;
        darray_destroy(kss);
        kss = NULL;
    }

    return info;
}

/* INFO [section]
 *
 * Replies with the report produced by genVireInfoString() as a bulk string.
 * When no section argument is given, the "default" section is requested.
 * More than one argument is answered with the shared syntax error. */
void infoCommand(client *c) {
    char *section;
    sds report;

    /* Reject extra arguments before doing any work. */
    if (c->argc > 2) {
        addReply(c,shared.syntaxerr);
        return;
    }

    if (c->argc == 2) {
        section = c->argv[1]->ptr;
    } else {
        section = "default";
    }

    report = genVireInfoString(c->vel, section);
    addReplyBulkSds(c, report);
}

/* ECHO message: send the first argument back to the client as a bulk reply. */
void echoCommand(client *c) {
    robj *message = c->argv[1];

    addReplyBulk(c, message);
}

/* TIME: reply with a two element multi bulk holding the current wall clock
 * time as seconds and microseconds, both taken from gettimeofday(). */
void timeCommand(client *c) {
    struct timeval now;

    /* The return value is deliberately ignored: gettimeofday() can only
     * fail when handed a bad address, and &now is always valid. */
    gettimeofday(&now,NULL);

    addReplyMultiBulkLen(c,2);
    addReplyBulkLongLong(c,now.tv_sec);
    addReplyBulkLongLong(c,now.tv_usec);
}

/* Try to raise the maximum number of open files (RLIMIT_NOFILE) so that
 * 'maxclients' client connections can be served. On top of the clients the
 * function budgets threads*2 descriptors (thread count read from the
 * CONFIG_SOPN_THREADS option) plus CONFIG_MIN_RESERVED_FDS descriptors for
 * extra operations such as listening sockets, log files and so forth.
 *
 * If the limit cannot be set high enough for the requested number of
 * clients, the function does the reverse: it stores the number of clients
 * that can actually be handled into the CONFIG_SOPN_MAXCLIENTS option.
 *
 * Returns the open files limit the computation ended up with, or -1 when
 * that limit does not leave room for even a single client. */
int adjustOpenFilesLimit(int maxclients) {
    rlim_t maxfiles, finallimit = 0;
    rlim_t oldlimit;
    long long clients_left;
    int finalmaxclients;
    struct rlimit limit;
    int threads;

    conf_server_get(CONFIG_SOPN_THREADS,&threads);
    maxfiles = maxclients+threads*2+CONFIG_MIN_RESERVED_FDS;
    if (getrlimit(RLIMIT_NOFILE,&limit) == -1) {
        log_warn("Unable to obtain the current NOFILE limit (%s), assuming 1024 and setting the max clients configuration accordingly.",
            strerror(errno));
        oldlimit = 1024;
        finallimit = oldlimit;
    } else {
        oldlimit = limit.rlim_cur;

        /* Set the max number of files if the current limit is not enough
         * for our needs. */
        if (oldlimit < maxfiles) {
            rlim_t bestlimit;
            int setrlimit_error = 0;

            /* Try to set the file limit to match 'maxfiles' or at least
             * to the higher value supported less than maxfiles. */
            bestlimit = maxfiles;
            while(bestlimit > oldlimit) {
                rlim_t decr_step = 16;

                limit.rlim_cur = bestlimit;
                limit.rlim_max = bestlimit;
                if (setrlimit(RLIMIT_NOFILE,&limit) != -1) break;
                /* Remember why the last attempt failed for the warning
                 * printed below. */
                setrlimit_error = errno;

                /* We failed to set file limit to 'bestlimit'. Try with a
                 * smaller limit decrementing by a few FDs per iteration.
                 * The guard avoids wrapping the unsigned rlim_t below 0. */
                if (bestlimit < decr_step) break;
                bestlimit -= decr_step;
            }

            /* Assume that the limit we get initially is still valid if
             * our last try was even lower. */
            if (bestlimit < oldlimit) bestlimit = oldlimit;

            finallimit = bestlimit;
            if (bestlimit < maxfiles) {
                log_warn("You requested maxclients of %d "
                    "requiring at least %llu max file descriptors.",
                    maxclients,
                    (unsigned long long) maxfiles);
                log_warn("Server can't set maximum open files "
                    "to %llu because of OS error: %s.",
                    (unsigned long long) maxfiles, strerror(setrlimit_error));
                log_warn("Current maximum open files is %llu. ",
                    (unsigned long long) bestlimit);
            } else {
                log_warn("Increased maximum number of open files "
                    "to %llu (it was originally set to %llu).",
                    (unsigned long long) maxfiles,
                    (unsigned long long) oldlimit);
            }
        } else {
            finallimit = maxfiles;
        }
    }

    /* Do the subtraction in a signed type: rlim_t is unsigned, so a limit
     * smaller than the reserved descriptors would otherwise wrap around and
     * the "< 1" check below would depend on an implementation-defined
     * conversion back to int. */
    clients_left = (long long)finallimit -
        ((long long)threads*2 + CONFIG_MIN_RESERVED_FDS);
    if (clients_left < 1) {
        log_warn("Your current 'ulimit -n' "
            "of %llu is not enough for the server to start. "
            "Please increase your open file limit to at least "
            "%llu. Exiting.",
            (unsigned long long) oldlimit,
            (unsigned long long) maxfiles);
        return -1;
    }
    finalmaxclients = (int)clients_left;
    
    if (finallimit < maxfiles) {
        /* Publish the reduced client count through the configuration. */
        conf_value *cv = conf_value_create(CONF_VALUE_TYPE_STRING);
        cv->value = sdsfromlonglong((long long)finalmaxclients);
        conf_server_set(CONFIG_SOPN_MAXCLIENTS,cv);
        conf_value_destroy(cv);
        log_warn("maxclients has been reduced to %d to compensate for "
            "low ulimit. "
            "If you need higher maxclients increase 'ulimit -n'.",
            finalmaxclients);
    }
    
    return (int)finallimit;
}


================================================
FILE: src/vr_server.h
================================================
#ifndef _VR_SERVER_H_
#define _VR_SERVER_H_

#define CONFIG_MIN_RESERVED_FDS 32 /* For extra operations of
                                            * listening sockets, log files and so forth*/

#define CONFIG_AUTHPASS_MAX_LEN 512
#define PROTO_SHARED_SELECT_CMDS 10 /* Size of the shared.select[] array. */
#define CRON_DBS_PER_CALL 16

#define ACTIVE_EXPIRE_CYCLE_LOOKUPS_PER_LOOP 20 /* Lookups per loop. */
#define ACTIVE_EXPIRE_CYCLE_FAST_DURATION 1000 /* Microseconds */
#define ACTIVE_EXPIRE_CYCLE_SLOW_TIME_PERC 25 /* CPU max % for keys collection */
#define ACTIVE_EXPIRE_CYCLE_SLOW 0
#define ACTIVE_EXPIRE_CYCLE_FAST 1

/* Object kinds a SCAN-style iteration can run over. */
#define SCAN_TYPE_KEY   0
#define SCAN_TYPE_HASH  1
#define SCAN_TYPE_SET   2
#define SCAN_TYPE_ZSET  3

/* Redis maxmemory strategies */
#define CONFIG_DEFAULT_MAXMEMORY_POLICY MAXMEMORY_NO_EVICTION

/* Zip structure related defaults */
#define OBJ_HASH_MAX_ZIPLIST_ENTRIES 512
#define OBJ_HASH_MAX_ZIPLIST_VALUE 64
#define OBJ_SET_MAX_INTSET_ENTRIES 512
#define OBJ_ZSET_MAX_ZIPLIST_ENTRIES 128
#define OBJ_ZSET_MAX_ZIPLIST_VALUE 64

/* List defaults */
#define OBJ_LIST_MAX_ZIPLIST_SIZE -2
#define OBJ_LIST_COMPRESS_DEPTH 0

/* HyperLogLog defines */
#define CONFIG_DEFAULT_HLL_SPARSE_MAX_BYTES 3000

/* List related stuff */
#define LIST_HEAD 0
#define LIST_TAIL 1

#define ZSKIPLIST_MAXLEVEL 32 /* Should be enough for 2^32 elements */
#define ZSKIPLIST_P 0.25      /* Skiplist P = 1/4 */

/* Units */
#define UNIT_SECONDS 0
#define UNIT_MILLISECONDS 1

/* Hash table parameters */
#define HASHTABLE_MIN_FILL        10      /* Minimal hash table fill 10% */

/* Using the following macro you can run code inside serverCron() with the
 * specified period, specified in milliseconds.
 * The actual resolution depends on server.hz.
 *
 * The macro expands to an 'if (...)' header, so it must be followed by the
 * statement (or block) to run. Both arguments are parenthesized in the
 * expansion so that expressions such as 'loops + 1' keep their meaning.
 * Note that 1000/server.hz is an integer division: server.hz must be in the
 * range 1..1000, otherwise the expansion divides by zero. */
#define run_with_period(_ms_, cronloops) if (((_ms_) <= 1000/server.hz) || !((cronloops)%((_ms_)/(1000/server.hz))))

/* Macro used to obtain the current LRU clock.
 * If the current resolution is lower than the frequency we refresh the
 * LRU clock (as it should be in production servers) we return the
 * precomputed value, otherwise we need to resort to a function call.
 *
 * Concretely: when the cron period (1000/server.hz, integer division, in
 * milliseconds) does not exceed LRU_CLOCK_RESOLUTION the cached
 * server.lruclock is used, otherwise getLRUClock() is called. */
#define LRU_CLOCK() ((1000/server.hz <= LRU_CLOCK_RESOLUTION) ? server.lruclock : getLRUClock())

/* The following structure represents a node in the server.ready_keys list,
 * where we accumulate all the keys that had clients blocked with a blocking
 * operation such as B[LR]POP, but received new data in the context of the
 * last executed command.
 *
 * After the execution of every command or script, we run this list to check
 * if as a result we should serve data to clients blocked, unblocking them.
 * Note that server.ready_keys will not have duplicates as there is a
 * dictionary also called ready_keys in every structure representing a Redis
 * database, where we make sure to remember if a given key was already added
 * in the server.ready_keys list. */
typedef struct readyList {
    redisDb *db;    /* Database the key belongs to. */
    robj *key;      /* The key that received new data. */
} readyList;

/* Process-wide server state. A single instance named 'server' is declared
 * 'extern' further down in this header. Most fields mirror the Redis server
 * structure this code derives from. */
struct vr_server {
    aeEventLoop *el;
    dlist *clients;
    
    /* General */
    pid_t pid;                  /* Main process pid. */
    char *executable;           /* Absolute executable file path. */
    char *configfile;           /* Absolute config file path, or NULL */
    int hz;                     /* serverCron() calls frequency in hertz */

    struct darray dbs;           /* database array, type: redisDB */
    int dbnum;                  /* Total number of DBs */
    int dblnum;                 /* Logical number of configured DBs */
    int dbinum;                 /* Number of internal DBs per logical DB */
    
    dict *commands;             /* Command table */
    dict *orig_commands;        /* Command table before command renaming. */
    
    unsigned lruclock:LRU_BITS; /* Clock for LRU eviction */
    int activerehashing;        /* Incremental rehash in serverCron() */

    char *pidfile;              /* PID file path */
    int arch_bits;              /* 32 or 64 depending on sizeof(long) */
    char runid[CONFIG_RUN_ID_SIZE+1];  /* ID always different at every exec. */
    
    /* Networking */
    int port;                   /* TCP listening port */
    int tcp_backlog;            /* TCP listen() backlog */

    int tcpkeepalive;               /* Set SO_KEEPALIVE if non-zero. */
    size_t client_max_querybuf_len; /* Limit for client query buffer length */

    /* Zip structure config, see redis.conf for more information  */
    size_t hash_max_ziplist_entries;
    size_t hash_max_ziplist_value;
    size_t set_max_intset_entries;
    size_t zset_max_ziplist_entries;
    size_t zset_max_ziplist_value;
    size_t hll_sparse_max_bytes;
    /* List parameters */
    int list_max_ziplist_size;
    int list_compress_depth;
    
    clientBufferLimitsConfig client_obuf_limits[CLIENT_TYPE_OBUF_COUNT];

    dlist *monitors;    /* List of slaves and MONITORs */

    time_t starttime;       /* Server start time */

    /* time cache */
    time_t unixtime;        /* Unix time sampled every cron cycle. */
    long long mstime;       /* Like 'unixtime' but with milliseconds resolution. */

    char *unixsocket;           /* UNIX socket path */

    /* RDB / AOF loading information */
    int loading;                /* We are loading data from disk if true */
    off_t loading_total_bytes;
    off_t loading_loaded_bytes;
    time_t loading_start_time;
    off_t loading_process_events_interval_bytes;

    /* AOF persistence */
    int aof_state;                  /* AOF_(ON|OFF|WAIT_REWRITE) */
    int aof_fsync;                  /* Kind of fsync() policy */
    char *aof_filename;             /* Name of the AOF file */
    int aof_no_fsync_on_rewrite;    /* Don't fsync if a rewrite is in prog. */
    int aof_rewrite_perc;           /* Rewrite AOF if % growth is > M and... */
    off_t aof_rewrite_min_size;     /* the AOF file is at least N bytes. */
    off_t aof_rewrite_base_size;    /* AOF size on latest startup or rewrite. */
    off_t aof_current_size;         /* AOF current size. */
    int aof_rewrite_scheduled;      /* Rewrite once BGSAVE terminates. */
    pid_t aof_child_pid;            /* PID if rewriting process */
    dlist *aof_rewrite_buf_blocks;   /* Hold changes during an AOF rewrite. */
    sds aof_buf;      /* AOF buffer, written before entering the event loop */
    int aof_fd;       /* File descriptor of currently selected AOF file */
    int aof_selected_db; /* Currently selected DB in AOF */
    time_t aof_flush_postponed_start; /* UNIX time of postponed AOF flush */
    time_t aof_last_fsync;            /* UNIX time of last fsync() */
    time_t aof_rewrite_time_last;   /* Time used by last AOF rewrite run. */
    time_t aof_rewrite_time_start;  /* Current AOF rewrite start time. */
    int aof_lastbgrewrite_status;   /* VR_OK or VR_ERROR */
    unsigned long aof_delayed_fsync;  /* delayed AOF fsync() counter */
    int aof_rewrite_incremental_fsync;/* fsync incrementally while rewriting? */
    int aof_last_write_status;      /* VR_OK or VR_ERROR */
    int aof_last_write_errno;       /* Valid if aof_last_write_status is ERR */
    int aof_load_truncated;         /* Don't stop on unexpected AOF EOF. */
    /* AOF pipes used to communicate between parent and child during rewrite. */
    int aof_pipe_write_data_to_child;
    int aof_pipe_read_data_from_parent;
    int aof_pipe_write_ack_to_parent;
    int aof_pipe_read_ack_from_child;
    int aof_pipe_write_ack_to_child;
    int aof_pipe_read_ack_from_parent;
    int aof_stop_sending_diff;     /* If true stop sending accumulated diffs
                                      to child process. */
    sds aof_child_diff;             /* AOF diff accumulator child side. */

    /* RDB persistence */
    long long dirty;                /* Changes to DB from the last save */
    long long dirty_before_bgsave;  /* Used to restore dirty on failed BGSAVE */
    pid_t rdb_child_pid;            /* PID of RDB saving child */
    struct saveparam *saveparams;   /* Save points array for RDB */
    int saveparamslen;              /* Number of saving points */
    char *rdb_filename;             /* Name of RDB file */
    int rdb_compression;            /* Use compression in RDB? */
    int rdb_checksum;               /* Use RDB checksum? */
    time_t lastsave;                /* Unix time of last successful save */
    time_t lastbgsave_try;          /* Unix time of last attempted bgsave */
    time_t rdb_save_time_last;      /* Time used by last RDB save run. */
    time_t rdb_save_time_start;     /* Current RDB save start time. */
    int rdb_child_type;             /* Type of save by active child. */
    int lastbgsave_status;          /* VR_OK or VR_ERROR */
    int stop_writes_on_bgsave_err;  /* Don't allow writes if can't BGSAVE */
    int rdb_pipe_write_result_to_parent; /* RDB pipes used to return the state */
    int rdb_pipe_read_result_from_child; /* of each slave in diskless SYNC. */

    /* Scripting */
    //lua_State *lua; /* The Lua interpreter. We use just one for all clients */
    struct client *lua_client;   /* The "fake client" to query Redis from Lua */
    struct client *lua_caller;   /* The client running EVAL right now, or NULL */
    dict *lua_scripts;         /* A dictionary of SHA1 -> Lua scripts */
    mstime_t lua_time_limit;  /* Script timeout in milliseconds */
    mstime_t lua_time_start;  /* Start time of script, milliseconds time */
    int lua_write_dirty;  /* True if a write command was called during the
                             execution of the current script. */
    int lua_random_dirty; /* True if a random command was called during the
                             execution of the current script. */
    int lua_replicate_commands; /* True if we are doing single commands repl. */
    int lua_multi_emitted;/* True if we already propagated MULTI. */
    int lua_repl;         /* Script replication flags for redis.set_repl(). */
    int lua_timedout;     /* True if we reached the time limit for script
                             execution. */
    int lua_kill;         /* Kill the script if true. */
    int lua_always_replicate_commands; /* Default replication type. */

    /* Blocked clients */
    dlist *ready_keys;        /* List of readyList structures for BLPOP & co */

    /* Propagation of commands in AOF / replication */
    redisOpArray also_propagate;    /* Additional command to propagate. */

    /* Pubsub */
    dict *pubsub_channels;  /* Map channels to list of subscribed clients */
    dlist *pubsub_patterns;  /* A list of pubsub_patterns */
    int notify_keyspace_events; /* Events to propagate via Pub/Sub. This is an
                                   xor of NOTIFY_... flags. */

    /* Fast pointers to often looked up command */
    struct redisCommand *delCommand, *multiCommand, *lpushCommand, *lpopCommand,
                        *rpopCommand, *sremCommand, *execCommand;

    /* System hardware info */
    size_t system_memory_size;  /* Total memory in system as reported by OS */
};

/* ZSETs use a specialized version of Skiplists.
 *
 * One node of the skiplist. 'level' is a flexible array member, so the
 * number of levels of a node is fixed by how much memory the allocating
 * code reserves for it (not visible in this header). */
typedef struct zskiplistNode {
    robj *obj;                          /* Member object. */
    double score;                       /* Score the member is sorted by. */
    struct zskiplistNode *backward;     /* Link to the previous node. */
    struct zskiplistLevel {
        struct zskiplistNode *forward;  /* Next node on this level. */
        unsigned int span;              /* NOTE(review): presumably the number
                                           of nodes skipped by 'forward' --
                                           confirm in the zset code. */
    } level[];
} zskiplistNode;

/* Skiplist container: end points plus bookkeeping counters. */
typedef struct zskiplist {
    struct zskiplistNode *header, *tail;    /* First and last node. */
    unsigned long length;                   /* Element count. */
    int level;                              /* NOTE(review): presumably the
                                               highest level currently in
                                               use -- confirm. */
} zskiplist;

/* Sorted set value: a dictionary paired with a skiplist.
 * NOTE(review): presumably the dict maps members to scores while the
 * skiplist keeps them ordered -- confirm against the zset implementation. */
typedef struct zset {
    dict *dict;
    zskiplist *zsl;
} zset;

/* Structure to hold list iteration abstraction. */
typedef struct {
    robj *subject;           /* The list object being iterated. */
    unsigned char encoding;  /* Encoding recorded for 'subject'. */
    unsigned char direction; /* Iteration direction */
    quicklistIter *iter;     /* Underlying quicklist iterator. */
} listTypeIterator;

/* Structure for an entry while iterating over a list. */
typedef struct {
    listTypeIterator *li; /* Iterator this entry was obtained from. */
    quicklistEntry entry; /* Entry in quicklist */
} listTypeEntry;

/* Structure to hold set iteration abstraction. */
typedef struct {
    robj *subject;    /* The set object being iterated. */
    int encoding;     /* Encoding recorded for 'subject'. */
    int ii; /* intset iterator */
    dictIterator *di; /* Dictionary iterator. NOTE(review): presumably only
                         one of 'ii' / 'di' is used, depending on the
                         encoding -- confirm. */
} setTypeIterator;

/* Structure to hold hash iteration abstraction. Note that iteration over
 * hashes involves both fields and values. Because it is possible that
 * not both are required, store pointers in the iterator to avoid
 * unnecessary memory allocation for fields/values. */
typedef struct {
    robj *subject;  /* The hash object being iterated. */
    int encoding;   /* Encoding recorded for 'subject'. */

    /* Current field / value pointers.
     * NOTE(review): presumably used for the ziplist encoding -- confirm. */
    unsigned char *fptr, *vptr;

    /* Dictionary iterator and current entry.
     * NOTE(review): presumably used for the hash table encoding -- confirm. */
    dictIterator *di;
    dictEntry *de;
} hashTypeIterator;

/* Pre-built reply objects that command implementations hand to addReply()
 * (for example shared.ok and shared.syntaxerr). A single instance named
 * 'shared' is declared 'extern' in this header. */
struct sharedObjectsStruct {
    robj *crlf, *ok, *err, *emptybulk, *czero, *cone, *cnegone, *pong, *space,
    *colon, *nullbulk, *nullmultibulk, *queued,
    *emptymultibulk, *wrongtypeerr, *nokeyerr, *syntaxerr, *sameobjecterr,
    *outofrangeerr, *noscripterr, *loadingerr, *slowscripterr, *bgsaveerr,
    *masterdownerr, *roslaveerr, *execaborterr, *noautherr, *noadminerr, *noreplicaserr,
    *busykeyerr, *oomerr, *plus, *messagebulk, *pmessagebulk, *subscribebulk,
    *unsubscribebulk, *psubscribebulk, *punsubscribebulk, *del, *rpop, *lpop,
    *lpush, *emptyscan, *minstring, *maxstring,
    *select[PROTO_SHARED_SELECT_CMDS],
    *integers[OBJ_SHARED_INTEGERS],
    *mbulkhdr[OBJ_SHARED_BULKHDR_LEN], /* "*<value>\r\n" */
    *bulkhdr[OBJ_SHARED_BULKHDR_LEN],  /* "$<value>\r\n" */
    *outofcomplexitylimit,
    *sentinel;  /* NULL pointer */
};


/* Globals defined in the implementation files: the server state, the shared
 * reply objects and the dictionary type descriptors. */
extern struct vr_server server;
extern struct sharedObjectsStruct shared;
extern dictType hashDictType;
extern dictType setDictType;
extern dictType zsetDictType;

/* Both macros report through _log() at LOG_EMERG, passing the stringified
 * argument (#_e) as the message detail.
 *
 * serverPanic() stringifies whatever tokens it is given, it does not format
 * a message. serverAssertWithInfo() only logs when _e evaluates to false and
 * does not use its _c and _o arguments.
 * NOTE(review): the meaning of the literal 1 passed to _log() is not visible
 * here -- presumably a "panic" flag; confirm in the logging header. */
#define serverPanic(_e) _log(__FILE__, __LINE__, LOG_EMERG, 1, "assert faild: %s", #_e)
#define serverAssertWithInfo(_c,_o,_e) ((_e)?(void)0 : (_log(__FILE__, __LINE__, LOG_EMERG, 1, "assert faild: %s", #_e)))

/* Dictionary callbacks (hashing, key comparison, key duplication and
 * destructors). NOTE(review): grouped by name only; the implementations are
 * not visible from this header. */
unsigned int dictStrHash(const void *key);
unsigned int dictStrCaseHash(const void *key);
unsigned int dictSdsHash(const void *key);
unsigned int dictSdsCaseHash(const void *key);
int dictStrKeyCompare(void *privdata, const void *key1, const void *key2);
int dictStrKeyCaseCompare(void *privdata, const void *key1, const void *key2);
int dictSdsKeyCompare(void *privdata, const void *key1, const void *key2);
int dictSdsKeyCaseCompare(void *privdata, const void *key1, const void *key2);
void *dictSdsKeyDupFromStr(void *privdata, const void *key);
void dictSdsDestructor(void *privdata, void *val);
void dictObjectDestructor(void *privdata, void *val);
int dictEncObjKeyCompare(void *privdata, const void *key1, const void *key2);
unsigned int dictEncObjHash(const void *key);
unsigned int dictObjHash(const void *key);
int dictObjKeyCompare(void *privdata, const void *key1, const void *key2);
void dictListDestructor(void *privdata, void *val);

int init_server(struct instance *nci);

/* Used by the LRU_CLOCK() macro when the cached clock cannot be used. */
unsigned int getLRUClock(void);

int freeMemoryIfNeeded(vr_eventloop *vel);
void pingCommand(struct client *c);
int time_independent_strcmp(char *a, char *b);
void authCommand(struct client *c) ;
void adminCommand(struct client *c) ;

int htNeedsResize(dict *dict);

/* INFO report generation and the INFO / ECHO / TIME command handlers. */
sds genVireInfoString(vr_eventloop *vel, char *section);
void infoCommand(client *c);
void echoCommand(client *c);
void timeCommand(client *c);

/* Raises RLIMIT_NOFILE for 'maxclients'; returns the resulting limit or -1. */
int adjustOpenFilesLimit(int maxclients);

#endif


================================================
FILE: src/vr_signal.c
================================================
#include <stdlib.h>
#include <signal.h>

#include <vr_core.h>
#include <vr_signal.h>

/* Table of the signals installed by signal_init(): signal number, printable
 * name, sigaction flags and handler. SIGSEGV is registered with
 * SA_RESETHAND and SIGPIPE is ignored (SIG_IGN). The entry with signo 0
 * terminates the table. */
static struct signal signals[] = {
    { SIGUSR1, "SIGUSR1", 0,                 signal_handler },
    { SIGUSR2, "SIGUSR2", 0,                 signal_handler },
    { SIGTTIN, "SIGTTIN", 0,                 signal_handler },
    { SIGTTOU, "SIGTTOU", 0,                 signal_handler },
    { SIGHUP,  "SIGHUP",  0,                 signal_handler },
    { SIGINT,  "SIGINT",  0,                 signal_handler },
    { SIGSEGV, "SIGSEGV", (int)SA_RESETHAND, signal_handler },
    { SIGPIPE, "SIGPIPE", 0,                 SIG_IGN },
    { 0,        NULL,     0,                 NULL }
};

rstatus_t
signal_init(void)
{
    struct signal *sig;

    for (sig = signals; sig->signo != 0; sig++) {
        rstatus_t status;
        struct sigaction sa;

        memset(&sa, 0, sizeof(sa));
        sa.sa_handler = sig->handler;
        sa.sa_flags = sig->flags;
        sigemptyset(&sa.sa_mask);

        status = sigaction(sig->signo, &sa, NULL);
        if (status < 0) {
            log_error("sigaction(%s) failed: %s", sig->signame,
                      strerror(errno));
            return VR_ERROR;
        }
    }

    return VR_OK;
}

/* Counterpart of signal_init(). Currently a no-op: the installed signal
 * dispositions are left as they are. */
void
signal_deinit(void)
{
}

/* Handler shared by the entries of the 'signals' table.
 *
 * Looks up the table entry of 'signo' (used for its printable name), picks
 * the reaction for the signal, logs one line through log_safe() and then
 * carries the reaction out:
 *   SIGUSR1 / SIGUSR2  nothing besides the log line
 *   SIGTTIN / SIGTTOU  log_level_up() / log_level_down()
 *   SIGHUP             log_reopen()
 *   SIGINT             exit(1)
 *   SIGSEGV            log_stacktrace() and re-raise SIGSEGV */
void
signal_handler(int signo)
{
    struct signal *entry = signals;
    void (*callback)(void) = NULL;
    char *note = "";
    bool quit = false;

    /* Stop either on the matching entry or on the table terminator. */
    while (entry->signo != 0 && entry->signo != signo) {
        entry++;
    }
    ASSERT(entry->signo != 0);

    switch (signo) {
    case SIGUSR1:
    case SIGUSR2:
        /* Accepted, nothing to do. */
        break;

    case SIGTTIN:
        note = ", up logging level";
        callback = log_level_up;
        break;

    case SIGTTOU:
        note = ", down logging level";
        callback = log_level_down;
        break;

    case SIGHUP:
        note = ", reopening log file";
        callback = log_reopen;
        break;

    case SIGINT:
        note = ", exiting";
        quit = true;
        break;

    case SIGSEGV:
        /* The table registers SIGSEGV with SA_RESETHAND, so the signal
         * raised again here is no longer routed to this handler. */
        log_stacktrace();
        note = ", core dumping";
        raise(SIGSEGV);
        break;

    default:
        NOT_REACHED();
    }

    log_safe("signal %d (%s) received%s", signo, entry->signame, note);

    if (callback != NULL) {
        callback();
    }

    if (quit) {
        exit(1);
    }
}


================================================
FILE: src/vr_signal.h
================================================
#ifndef _VR_SIGNAL_H_
#define _VR_SIGNAL_H_

/* One row of the signal table installed by signal_init(). */
struct signal {
    int  signo;                 /* Signal number; 0 terminates the table. */
    char *signame;              /* Printable name used in log messages. */
    int  flags;                 /* Value stored in sigaction.sa_flags. */
    void (*handler)(int signo); /* Value stored in sigaction.sa_handler. */
};

/* Install the signal table; returns VR_OK or VR_ERROR. */
rstatus_t signal_init(void);
/* Counterpart of signal_init(); currently does nothing. */
void signal_deinit(void);
/* Common handler for the signals routed to the process. */
void signal_handler(int signo);

#endif


================================================
FILE: src/vr_slowlog.c
================================================
#include <vr_core.h>

/* Module state. 'rwlocker' is taken around accesses to the list and the ID
 * counter by the functions in this file. */
static pthread_rwlock_t rwlocker;
static dlist *slowlog;                  /* SLOWLOG list of commands */
static long long slowlog_entry_id;     /* SLOWLOG current entry ID */

/* Build a slow log entry describing the command argv[0..argc-1] that took
 * 'duration' to execute.
 *
 * The entry owns private copies of the arguments. At most
 * SLOWLOG_ENTRY_MAX_ARGC arguments are kept and string arguments longer than
 * SLOWLOG_ENTRY_MAX_STRING bytes are cut, in both cases with a note telling
 * how much was left out. The 'id' field is not set here: it is up to the
 * caller to assign it. */
slowlogEntry *slowlogCreateEntry(robj **argv, int argc, long long duration) {
    int kept = (argc > SLOWLOG_ENTRY_MAX_ARGC) ? SLOWLOG_ENTRY_MAX_ARGC : argc;
    int truncated = (kept != argc);
    slowlogEntry *entry = dalloc(sizeof(*entry));
    int i;

    entry->argc = kept;
    entry->argv = dalloc(sizeof(robj*)*kept);

    for (i = 0; i < kept; i++) {
        robj *arg;
        sds text;

        /* Logging too many arguments is a useless memory waste: when the
         * command had more than we keep, the last slot is replaced by a
         * note with the number of arguments that were dropped. */
        if (truncated && i == kept-1) {
            text = sdscatprintf(sdsempty(),"... (%d more arguments)",
                argc-kept+1);
            entry->argv[i] = createObject(OBJ_STRING,text);
            continue;
        }

        arg = argv[i];

        /* Anything that is not an over-long sds string is copied as is. */
        if (arg->type != OBJ_STRING ||
            !(sdsEncodedObject(arg)) ||
            sdslen(arg->ptr) <= SLOWLOG_ENTRY_MAX_STRING)
        {
            entry->argv[i] = dupStringObjectUnconstant(arg);
            continue;
        }

        /* Trim too long strings as well... */
        text = sdsnewlen(arg->ptr, SLOWLOG_ENTRY_MAX_STRING);
        text = sdscatprintf(text,"... (%lu more bytes)",
            (unsigned long)
            sdslen(arg->ptr) - SLOWLOG_ENTRY_MAX_STRING);
        entry->argv[i] = createObject(OBJ_STRING,text);
    }

    entry->time = time(NULL);
    entry->duration = duration;
    return entry;
}

/* Free a slow log entry. The argument is void so that the prototype of this
 * function matches the one of the 'free' method of adlist.c.
 *
 * This function will take care to release all the retained object. */
void slowlogFreeEntry(void *septr) {
    slowlogEntry *se = septr;
    int j;

    for (j = 0; j < se->argc; j++)
        freeObject(se->argv[j]);
    dfree(se->argv);
    dfree(se);
}

/* Set up the slow log: the lock, an empty list whose nodes are released
 * with slowlogFreeEntry(), and the entry ID counter starting from zero.
 * Meant to be called a single time at server startup. */
void slowlogInit(void) {
    slowlog_entry_id = 0;

    pthread_rwlock_init(&rwlocker,NULL);

    slowlog = dlistCreate();
    dlistSetFreeMethod(slowlog,slowlogFreeEntry);
}

/* Record the command in the slow log when 'duration' reaches the
 * slowlog_log_slower_than threshold cached in 'vel', then trim the log to
 * the configured maximum length (CONFIG_SOPN_SLOWLOGML).
 *
 * A negative threshold means the slow log is disabled: nothing is recorded
 * and nothing is trimmed. Otherwise the trimming step runs on every call,
 * whether or not an entry was added. */
void slowlogPushEntryIfNeeded(vr_eventloop *vel, robj **argv, int argc, long long duration) {
    long long threshold = vel->cc.slowlog_log_slower_than;
    int max_entries;

    if (threshold < 0) {
        return; /* Slowlog disabled */
    }

    if (duration >= threshold) {
        /* Build the entry outside the lock; only the ID assignment and the
         * list insertion need it. */
        slowlogEntry *entry = slowlogCreateEntry(argv,argc,duration);

        pthread_rwlock_wrlock(&rwlocker);
        entry->id = slowlog_entry_id++;
        dlistAddNodeHead(slowlog,entry);
        pthread_rwlock_unlock(&rwlocker);
    }

    conf_server_get(CONFIG_SOPN_SLOWLOGML,&max_entries);

    /* Remove old entries if needed: new ones are added at the head, so the
     * tail is dropped. */
    pthread_rwlock_wrlock(&rwlocker);
    for (;;) {
        if (!(dlistLength(slowlog) > max_entries)) break;
        dlistDelNode(slowlog,dlistLast(slowlog));
    }
    pthread_rwlock_unlock(&rwlocker);
}

/* Empty the slow log, deleting the entries one by one from the tail while
 * holding the write lock. */
void slowlogReset(void) {
    pthread_rwlock_wrlock(&rwlocker);
    for (;;) {
        if (!(dlistLength(slowlog) > 0)) break;
        dlistDelNode(slowlog,dlistLast(slowlog));
    }
    pthread_rwlock_unlock(&rwlocker);
}

/* The SLOWLOG command.
 *
 *   SLOWLOG RESET        empties the log and replies OK
 *   SLOWLOG LEN          replies with the number of entries
 *   SLOWLOG GET [count]  replies with up to 'count' entries (10 when not
 *                        given) starting from the head of the list; every
 *                        entry is a four element multi bulk made of id,
 *                        time, duration and the argument vector
 *
 * Anything else is answered with an error. */
void slowlogCommand(client *c) {
    long count = 10, sent = 0;
    dlistIter li;
    dlistNode *ln;
    void *totentries;

    if (c->argc == 2 && !strcasecmp(c->argv[1]->ptr,"reset")) {
        slowlogReset();
        addReply(c,shared.ok);
        return;
    }

    if (c->argc == 2 && !strcasecmp(c->argv[1]->ptr,"len")) {
        unsigned long len;

        pthread_rwlock_rdlock(&rwlocker);
        len = dlistLength(slowlog);
        pthread_rwlock_unlock(&rwlocker);
        addReplyLongLong(c,len);
        return;
    }

    /* From here on only GET with one or two arguments is acceptable. */
    if ((c->argc != 2 && c->argc != 3) ||
        strcasecmp(c->argv[1]->ptr,"get") != 0)
    {
        addReplyError(c,
            "Unknown SLOWLOG subcommand or wrong # of args. Try GET, RESET, LEN.");
        return;
    }

    if (c->argc == 3 &&
        getLongFromObjectOrReply(c,c->argv[2],&count,NULL) != VR_OK)
    {
        return;
    }

    /* The number of entries is only known once the walk is over, hence the
     * deferred multi bulk length. */
    pthread_rwlock_rdlock(&rwlocker);
    dlistRewind(slowlog,&li);
    totentries = addDeferredMultiBulkLength(c);
    for (;;) {
        slowlogEntry *se;
        int j;

        if (count-- == 0) break;
        ln = dlistNext(&li);
        if (ln == NULL) break;

        se = ln->value;
        addReplyMultiBulkLen(c,4);
        addReplyLongLong(c,se->id);
        addReplyLongLong(c,se->time);
        addReplyLongLong(c,se->duration);
        addReplyMultiBulkLen(c,se->argc);
        for (j = 0; j < se->argc; j++) {
            addReplyBulk(c,se->argv[j]);
        }
        sent++;
    }
    pthread_rwlock_unlock(&rwlocker);
    setDeferredMultiBulkLength(c,totentries,sent);
}


================================================
FILE: src/vr_slowlog.h
================================================
#ifndef _VR_SLOWLOG_H_
#define _VR_SLOWLOG_H_

/* Limits applied by slowlogCreateEntry(): maximum number of arguments kept
 * per entry and maximum number of bytes kept per string argument. */
#define SLOWLOG_ENTRY_MAX_ARGC 32
#define SLOWLOG_ENTRY_MAX_STRING 128

/* This structure defines an entry inside the slow log list */
typedef struct slowlogEntry {
    robj **argv;        /* Private copies of the (possibly trimmed) arguments. */
    int argc;           /* Number of elements in argv. */
    long long id;       /* Unique entry identifier. */
    long long duration; /* Time spent by the query, in nanoseconds.
                           NOTE(review): the unit is whatever the caller of
                           slowlogPushEntryIfNeeded() passes -- confirm. */
    time_t time;        /* Unix time at which the query was executed. */
} slowlogEntry;

/* Exported API */
/* One-time setup of the slow log state. */
void slowlogInit(void);
/* Logs the command if it was slow enough, then trims the log. */
void slowlogPushEntryIfNeeded(vr_eventloop *vel, robj **argv, int argc, long long duration);

/* Exported commands */
/* SLOWLOG GET / LEN / RESET. */
void slowlogCommand(client *c);

#endif


================================================
FILE: src/vr_stats.c
================================================
#include <vr_core.h>
#include <string.h>

/* Bring a statistics block into its initial state: every counter is zero,
 * the instantaneous metric samplers are cleared and 'starttime' holds the
 * current time.
 *
 * When the counters are protected by a spinlock (atomic updates not
 * selected or not available) the lock is created as well.
 *
 * Returns VR_OK on success, VR_ERROR when 'stats' is NULL or the spinlock
 * cannot be created. */
int
vr_stats_init(vr_stats *stats)
{
    if (stats == NULL) {
        return VR_ERROR;
    }

    stats->starttime = 0;
    stats->numcommands = 0;
    stats->numconnections = 0;
    stats->expiredkeys = 0;
    stats->evictedkeys = 0;
    stats->keyspace_hits = 0;
    stats->keyspace_misses = 0;
    stats->rejected_conn = 0;
    stats->sync_full = 0;
    stats->sync_partial_ok = 0;
    stats->sync_partial_err = 0;
    stats->net_input_bytes = 0;
    stats->net_output_bytes = 0;
    stats->peak_memory = 0;

    /* The samplers must start from a known state: trackInstantaneousMetric()
     * uses 'idx' to index the samples array, so it has to be a valid slot
     * even when the caller handed us memory that was not zeroed. */
    memset(stats->inst_metric, 0, sizeof(stats->inst_metric));
    
#if !defined(STATS_ATOMIC_FIRST) || (!defined(__ATOMIC_RELAXED) && !defined(HAVE_ATOMIC))
    if (pthread_spin_init(&stats->statslock, 0) != 0) {
        return VR_ERROR;
    }
#endif

    stats->starttime = time(NULL);

    return VR_OK;
}

/* Tear down a statistics block: the counters reset by this function go back
 * to zero and, when the spinlock variant is compiled in, the lock is
 * destroyed. A NULL 'stats' is ignored. */
void
vr_stats_deinit(vr_stats *stats)
{
    if (stats == NULL) return;

    stats->starttime = 0;

    /* Command and connection counters. */
    stats->numcommands = stats->numconnections = 0;
    stats->rejected_conn = 0;

    /* Keyspace counters. */
    stats->expiredkeys = stats->evictedkeys = 0;
    stats->keyspace_hits = stats->keyspace_misses = 0;

    /* Replication counters. */
    stats->sync_full = 0;
    stats->sync_partial_ok = stats->sync_partial_err = 0;

    /* Network counters. */
    stats->net_input_bytes = stats->net_output_bytes = 0;
    
#if !defined(STATS_ATOMIC_FIRST) || (!defined(__ATOMIC_RELAXED) && !defined(HAVE_ATOMIC))
    pthread_spin_destroy(&stats->statslock);
#endif
}

/* Feed a new reading of 'metric' to its sampler.
 *
 * The per-second rate since the previous reading is stored in the current
 * slot of the samples array (zero when no time has elapsed), the slot index
 * advances circularly and the reading is remembered, together with the
 * current time, for the next call. */
void trackInstantaneousMetric(vr_stats *stats, int metric, long long current_reading) {
    long long elapsed_ms = vr_msec_now() - stats->inst_metric[metric].last_sample_time;
    long long delta = current_reading -
                      stats->inst_metric[metric].last_sample_count;
    long long rate = 0;

    if (elapsed_ms > 0) {
        rate = delta*1000/elapsed_ms;
    }

    update_stats_set(stats,inst_metric[metric].samples[stats->inst_metric[metric].idx],rate);

    /* Move to the next slot, wrapping at the end of the array. */
    stats->inst_metric[metric].idx =
        (stats->inst_metric[metric].idx + 1) % STATS_METRIC_SAMPLES;

    stats->inst_metric[metric].last_sample_time = vr_msec_now();
    stats->inst_metric[metric].last_sample_count = current_reading;
}

/* Average of the STATS_METRIC_SAMPLES samples currently stored for 'metric'
 * (integer division). */
long long getInstantaneousMetric(vr_stats *stats, int metric) {
    long long total = 0;
    int slot = 0;

    while (slot < STATS_METRIC_SAMPLES) {
        long long sample;

        update_stats_get(stats, inst_metric[metric].samples[slot], &sample);
        total += sample;
        slot++;
    }

    return total / STATS_METRIC_SAMPLES;
}


================================================
FILE: src/vr_stats.h
================================================
#ifndef _VR_STATS_H_
#define _VR_STATS_H_

/* Compile-time switch: when STATS_ATOMIC_FIRST is defined the preprocessor
 * conditions in this header select atomic operations if they are available,
 * otherwise a spinlock inside vr_stats is used. */
#if 1
#define STATS_ATOMIC_FIRST 1
#endif

/* Instantaneous metrics tracking. */
#define STATS_METRIC_SAMPLES 16     /* Number of samples per metric. */
#define STATS_METRIC_COMMAND 0      /* Number of commands executed. */
#define STATS_METRIC_NET_INPUT 1    /* Bytes read from network. */
#define STATS_METRIC_NET_OUTPUT 2   /* Bytes written to network. */
#define STATS_METRIC_COUNT 3

/* Statistics container. Counters are meant to be read and written through
 * the update_stats_*() macros defined below, which use either atomic
 * builtins or the 'statslock' spinlock depending on the build. */
typedef struct vr_stats {
    /* Fields used only for stats */
    time_t starttime;          /* Server start time */
    long long numcommands;     /* Number of processed commands */
    long long numconnections;  /* Number of connections received */
    long long expiredkeys;     /* Number of expired keys */
    long long evictedkeys;     /* Number of evicted keys (maxmemory) */
    long long keyspace_hits;   /* Number of successful lookups of keys */
    long long keyspace_misses; /* Number of failed lookups of keys */
    long long rejected_conn;   /* Clients rejected because of maxclients */
    long long sync_full;       /* Number of full resyncs with slaves. */
    long long sync_partial_ok; /* Number of accepted PSYNC requests. */
    long long sync_partial_err;/* Number of unaccepted PSYNC requests. */
    long long net_input_bytes; /* Bytes read from network. */
    long long net_output_bytes; /* Bytes written to network. */
    size_t    peak_memory;     /* Max used memory record */
    
    /* The following two are used to track instantaneous metrics, like
     * number of operations per second, network traffic. */
    struct {
        long long last_sample_time; /* Timestamp of last sample in ms */
        long long last_sample_count;/* Count in last sample */
        long long samples[STATS_METRIC_SAMPLES]; /* Circular buffer of per-second rates */
        int idx;                    /* Next slot of samples[] to overwrite */
    } inst_metric[STATS_METRIC_COUNT];

    /* Only present when the spinlock flavour of update_stats_*() is built. */
#if !defined(STATS_ATOMIC_FIRST) || (!defined(__ATOMIC_RELAXED) && !defined(HAVE_ATOMIC))
    pthread_spinlock_t statslock;
#endif
}vr_stats;

/* Counter access macros.
 *
 *   update_stats_add(stats, field, n)  - add n to stats->field
 *   update_stats_sub(stats, field, n)  - subtract n from stats->field
 *   update_stats_set(stats, field, n)  - store n into stats->field
 *   update_stats_get(stats, field, v)  - copy stats->field into *v
 *
 * '_stats' is a pointer to the stats structure, '_field' is a member
 * designator (it may contain subscripts, e.g. inst_metric[i].samples[j]) and
 * '_v' is a pointer to the destination. All expression arguments are
 * parenthesized so that callers may pass arbitrary expressions such as
 * 'buf + 1'. STATS_LOCK_TYPE names the implementation that was selected. */

/* GCC version >= 4.7 */
#if defined(__ATOMIC_RELAXED) && defined(STATS_ATOMIC_FIRST)
#define update_stats_add(_stats, _field, _n) __atomic_add_fetch(&(_stats)->_field, (_n), __ATOMIC_RELAXED)
#define update_stats_sub(_stats, _field, _n) __atomic_sub_fetch(&(_stats)->_field, (_n), __ATOMIC_RELAXED)
#define update_stats_set(_stats, _field, _n) __atomic_store_n(&(_stats)->_field, (_n), __ATOMIC_RELAXED)
#define update_stats_get(_stats, _field, _v) do {             \
    __atomic_load(&(_stats)->_field, (_v), __ATOMIC_RELAXED); \
} while(0)

#define STATS_LOCK_TYPE "__ATOMIC_RELAXED"
/* GCC version >= 4.1 */
#elif defined(HAVE_ATOMIC) && defined(STATS_ATOMIC_FIRST)
#define update_stats_add(_stats, _field, _n) __sync_add_and_fetch(&(_stats)->_field, (_n))
#define update_stats_sub(_stats, _field, _n) __sync_sub_and_fetch(&(_stats)->_field, (_n))
#define update_stats_set(_stats, _field, _n) __sync_lock_test_and_set(&(_stats)->_field, (_n))
/* Adding 0 is used as an atomic read. */
#define update_stats_get(_stats, _field, _v) do {           \
    (*(_v)) = __sync_add_and_fetch(&(_stats)->_field, 0);   \
} while(0)

#define STATS_LOCK_TYPE "HAVE_ATOMIC"
#else
/* Fallback: every access is serialized with the per-stats spinlock. */
#define update_stats_add(_stats, _field, _n) do {   \
    pthread_spin_lock(&(_stats)->statslock);        \
    (_stats)->_field += (_n);                       \
    pthread_spin_unlock(&(_stats)->statslock);      \
} while(0)

#define update_stats_sub(_stats, _field, _n) do {   \
    pthread_spin_lock(&(_stats)->statslock);        \
    (_stats)->_field -= (_n);                       \
    pthread_spin_unlock(&(_stats)->statslock);      \
} while(0)

#define update_stats_set(_stats, _field, _n) do {   \
    pthread_spin_lock(&(_stats)->statslock);        \
    (_stats)->_field = (_n);                        \
    pthread_spin_unlock(&(_stats)->statslock);      \
} while(0)

#define update_stats_get(_stats, _field, _v) do {   \
    pthread_spin_lock(&(_stats)->statslock);        \
    (*(_v)) = (_stats)->_field;                     \
    pthread_spin_unlock(&(_stats)->statslock);      \
} while(0)

#define STATS_LOCK_TYPE "pthread_spin_lock"
#endif

/* Lifecycle of a vr_stats structure (implemented in vr_stats.c). */
int vr_stats_init(vr_stats *stats);
void vr_stats_deinit(vr_stats *stats);

/* Instantaneous metrics: 'metric' is one of the STATS_METRIC_* indexes.
 * trackInstantaneousMetric() records a new per-second rate sample computed
 * from 'current_reading'; getInstantaneousMetric() returns the mean of the
 * stored samples. */
void trackInstantaneousMetric(vr_stats *stats, int metric, long long current_reading);
long long getInstantaneousMetric(vr_stats *stats, int metric);

#endif


================================================
FILE: src/vr_t_hash.c
================================================
#include <math.h>

#include <vr_core.h>

/*-----------------------------------------------------------------------------
 * Hash type API
 *----------------------------------------------------------------------------*/

/* Convert a ziplist encoded hash to a hash table when any of the arguments
 * argv[start..end] (inclusive) is longer than server.hash_max_ziplist_value.
 * Only string (sds) encoded arguments are examined, since their length is
 * available in constant time. Hashes that are not ziplist encoded are left
 * untouched. */
void hashTypeTryConversion(robj *o, robj **argv, int start, int end) {
    int idx = start;

    if (o->encoding != OBJ_ENCODING_ZIPLIST) return;

    while (idx <= end) {
        robj *arg = argv[idx++];

        if (!sdsEncodedObject(arg)) continue;
        if (sdslen(arg->ptr) <= server.hash_max_ziplist_value) continue;

        /* One oversized argument is enough: convert and stop scanning. */
        hashTypeConvert(o, OBJ_ENCODING_HT);
        return;
    }
}

/* When 'subject' is a hash table encoded hash, replace *o1 and *o2 with the
 * result of tryObjectEncoding(). Either pointer may be NULL to skip it.
 * Nothing is done for other encodings. */
void hashTypeTryObjectEncoding(robj *subject, robj **o1, robj **o2) {
    if (subject->encoding != OBJ_ENCODING_HT) return;

    if (o1 != NULL) *o1 = tryObjectEncoding(*o1);
    if (o2 != NULL) *o2 = tryObjectEncoding(*o2);
}

/* Look up 'field' in a ziplist encoded hash.
 *
 * On success 0 is returned and the value is reported through ziplistGet()
 * into 'vstr'/'vlen' or 'vll'. When the field is not present -1 is
 * returned and the output arguments are not touched. */
int hashTypeGetFromZiplist(robj *o, robj *field,
                           unsigned char **vstr,
                           unsigned int *vlen,
                           long long *vll)
{
    unsigned char *zl, *entry, *val = NULL;
    robj *decoded;
    int ok;

    ASSERT(o->encoding == OBJ_ENCODING_ZIPLIST);

    /* The lookup needs the string form of the field. */
    decoded = getDecodedObject(field);

    zl = o->ptr;
    entry = ziplistIndex(zl, ZIPLIST_HEAD);
    if (entry != NULL) {
        entry = ziplistFind(entry, decoded->ptr, sdslen(decoded->ptr), 1);
    }
    if (entry != NULL) {
        /* The value is stored right after its field. */
        val = ziplistNext(zl, entry);
        ASSERT(val != NULL);
    }

    /* Release the temporary object if decoding produced a new one. */
    if (decoded != field) freeObject(decoded);

    if (val == NULL) return -1;

    ok = ziplistGet(val, vstr, vlen, vll);
    ASSERT(ok);
    return 0;
}

/* Look up 'field' in a hash table encoded hash.
 * Returns 0 and stores the dictionary's value pointer in '*value' when the
 * field exists, otherwise returns -1 and leaves '*value' untouched. */
int hashTypeGetFromHashTable(robj *o, robj *field, robj **value) {
    dictEntry *entry;

    ASSERT(o->encoding == OBJ_ENCODING_HT);

    entry = dictFind(o->ptr, field);
    if (entry != NULL) {
        *value = dictGetVal(entry);
        return 0;
    }
    return -1;
}

/* Higher level wrapper around hashTypeGetFrom*() returning the value of
 * 'field' as an object, or NULL when the field does not exist.
 *
 * Ownership depends on the encoding of the hash:
 *  - ziplist: a newly created string object is returned.
 *  - hash table: the pointer stored in the dictionary is returned as is.
 * Callers in this file free the result only when the hash is ziplist
 * encoded. */
robj *hashTypeGetObject(robj *o, robj *field) {
    if (o->encoding == OBJ_ENCODING_HT) {
        robj *stored;

        if (hashTypeGetFromHashTable(o, field, &stored) != 0) return NULL;
        return stored;
    }

    if (o->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *vstr = NULL;
        unsigned int vlen = UINT_MAX;
        long long vll = LLONG_MAX;

        if (hashTypeGetFromZiplist(o, field, &vstr, &vlen, &vll) != 0) {
            return NULL;
        }
        /* A ziplist entry is either a byte string or an integer. */
        return vstr ? createStringObject((char*)vstr, vlen)
                    : createStringObjectFromLongLong(vll);
    }

    serverPanic("Unknown hash encoding");
    return NULL;
}

/* Return the length of the value stored at 'field', or 0 when the field
 * does not exist. For integer ziplist entries the length is the number of
 * characters reported by sdigits10(). */
size_t hashTypeGetValueLength(robj *o, robj *field) {
    if (o->encoding == OBJ_ENCODING_HT) {
        robj *stored;

        if (hashTypeGetFromHashTable(o, field, &stored) != 0) return 0;
        return stringObjectLen(stored);
    }

    if (o->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *vstr = NULL;
        unsigned int vlen = UINT_MAX;
        long long vll = LLONG_MAX;
        size_t len = 0;

        if (hashTypeGetFromZiplist(o, field, &vstr, &vlen, &vll) == 0) {
            len = vstr ? vlen : sdigits10(vll);
        }
        return len;
    }

    serverPanic("Unknown hash encoding");
    return 0;
}

/* Return 1 when 'field' is present in the hash 'o', 0 otherwise. */
int hashTypeExists(robj *o, robj *field) {
    if (o->encoding == OBJ_ENCODING_HT) {
        robj *stored;

        return hashTypeGetFromHashTable(o, field, &stored) == 0 ? 1 : 0;
    }

    if (o->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *vstr = NULL;
        unsigned int vlen = UINT_MAX;
        long long vll = LLONG_MAX;

        return hashTypeGetFromZiplist(o, field, &vstr, &vlen, &vll) == 0 ? 1 : 0;
    }

    serverPanic("Unknown hash encoding");
    return 0;
}

/* Set 'field' to 'value' in the hash 'o', replacing any previous value.
 * Returns 0 when a new field was inserted and 1 when an existing field was
 * updated.
 *
 * The field and value objects are only borrowed: the ziplist stores their
 * bytes, and the hash table stores duplicates made with
 * dupStringObjectUnconstant(). The caller keeps ownership of both. */
int hashTypeSet(robj *o, robj *field, robj *value) {
    if (o->encoding == OBJ_ENCODING_HT) {
        robj *fcopy = dupStringObjectUnconstant(field);
        robj *vcopy = dupStringObjectUnconstant(value);

        /* A non-zero result from dictReplace() means the key was added. */
        if (dictReplace(o->ptr, fcopy, vcopy)) return 0;

        /* Existing key: our duplicate of the field was not stored. */
        freeObject(fcopy);
        return 1;
    }

    if (o->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *zl, *fptr, *vptr;
        robj *fdec, *vdec;
        int replaced = 0;

        fdec = getDecodedObject(field);
        vdec = getDecodedObject(value);

        zl = o->ptr;
        fptr = ziplistIndex(zl, ZIPLIST_HEAD);
        if (fptr != NULL) {
            fptr = ziplistFind(fptr, fdec->ptr, sdslen(fdec->ptr), 1);
        }

        if (fptr != NULL) {
            /* Field found: swap the entry that follows it (the value). */
            vptr = ziplistNext(zl, fptr);
            ASSERT(vptr != NULL);
            replaced = 1;

            zl = ziplistDelete(zl, &vptr);
            zl = ziplistInsert(zl, vptr, vdec->ptr, sdslen(vdec->ptr));
        } else {
            /* Field missing: append the field/value pair at the tail. */
            zl = ziplistPush(zl, fdec->ptr, sdslen(fdec->ptr), ZIPLIST_TAIL);
            zl = ziplistPush(zl, vdec->ptr, sdslen(vdec->ptr), ZIPLIST_TAIL);
        }

        o->ptr = zl;
        if (fdec != field) freeObject(fdec);
        if (vdec != value) freeObject(vdec);

        /* Too many entries for a ziplist: switch to a hash table. */
        if (hashTypeLength(o) > server.hash_max_ziplist_entries) {
            hashTypeConvert(o, OBJ_ENCODING_HT);
        }
        return replaced;
    }

    serverPanic("Unknown hash encoding");
    return 0;
}

/* Delete 'field' from the hash 'o'.
 * Returns 1 when the field was found and removed, 0 when it was not found.
 *
 * For hash table encoded hashes the dictionary is shrunk after a successful
 * delete when htNeedsResize() says so. */
int hashTypeDelete(robj *o, robj *field) {
    int deleted = 0;

    if (o->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *zl, *fptr;
        robj *field_new;

        field_new = getDecodedObject(field);

        zl = o->ptr;
        fptr = ziplistIndex(zl, ZIPLIST_HEAD);
        if (fptr != NULL) {
            fptr = ziplistFind(fptr, field_new->ptr, sdslen(field_new->ptr), 1);
            if (fptr != NULL) {
                /* Two deletes at the same position: first the field, then
                 * the value that followed it. */
                zl = ziplistDelete(zl,&fptr);
                zl = ziplistDelete(zl,&fptr);
                o->ptr = zl;
                deleted = 1;
            }
        }

        if (field_new != field) freeObject(field_new);
    } else if (o->encoding == OBJ_ENCODING_HT) {
        /* dictDelete() is part of the dict API, so its result is compared
         * against DICT_OK like the other dict calls in this file. */
        if (dictDelete((dict*)o->ptr, field) == DICT_OK) {
            deleted = 1;

            /* Always check if the dictionary needs a resize after a delete. */
            if (htNeedsResize(o->ptr)) dictResize(o->ptr);
        }

    } else {
        serverPanic("Unknown hash encoding");
    }

    return deleted;
}

/* Number of field/value pairs stored in the hash 'o'.
 * A ziplist holds two entries per pair, hence the division by two. */
unsigned long hashTypeLength(robj *o) {
    if (o->encoding == OBJ_ENCODING_ZIPLIST) {
        return ziplistLen(o->ptr) / 2;
    }
    if (o->encoding == OBJ_ENCODING_HT) {
        return dictSize((dict*)o->ptr);
    }

    serverPanic("Unknown hash encoding");
    return ULONG_MAX;
}

/* Allocate an iterator over the hash 'subject'. The iterator remembers the
 * encoding of the hash at creation time. It must be released with
 * hashTypeReleaseIterator(). */
hashTypeIterator *hashTypeInitIterator(robj *subject) {
    hashTypeIterator *it = dalloc(sizeof(*it));

    it->subject = subject;
    it->encoding = subject->encoding;

    if (it->encoding == OBJ_ENCODING_HT) {
        it->di = dictGetIterator(subject->ptr);
    } else if (it->encoding == OBJ_ENCODING_ZIPLIST) {
        /* NULL cursors mean "not started yet" for hashTypeNext(). */
        it->fptr = NULL;
        it->vptr = NULL;
    } else {
        serverPanic("Unknown hash encoding");
    }

    return it;
}

/* Free an iterator created by hashTypeInitIterator(), including the
 * underlying dict iterator when the hash is hash table encoded. */
void hashTypeReleaseIterator(hashTypeIterator *hi) {
    int owns_dict_iter = (hi->encoding == OBJ_ENCODING_HT);

    if (owns_dict_iter) dictReleaseIterator(hi->di);
    dfree(hi);
}

/* Advance the iterator to the next field/value pair.
 * Returns VR_OK when a pair is available and VR_ERROR once the end of the
 * hash has been reached. */
int hashTypeNext(hashTypeIterator *hi) {
    unsigned char *zl, *field, *val;

    if (hi->encoding == OBJ_ENCODING_HT) {
        hi->de = dictNext(hi->di);
        return hi->de == NULL ? VR_ERROR : VR_OK;
    }

    if (hi->encoding != OBJ_ENCODING_ZIPLIST) {
        serverPanic("Unknown hash encoding");
        return VR_OK;
    }

    zl = hi->subject->ptr;
    if (hi->fptr == NULL) {
        /* First call: start from the head of the ziplist. */
        ASSERT(hi->vptr == NULL);
        field = ziplistIndex(zl, 0);
    } else {
        /* The next field follows the current value. */
        ASSERT(hi->vptr != NULL);
        field = ziplistNext(zl, hi->vptr);
    }
    if (field == NULL) return VR_ERROR;

    /* Every field is immediately followed by its value. */
    val = ziplistNext(zl, field);
    ASSERT(val != NULL);

    hi->fptr = field;
    hi->vptr = val;
    return VR_OK;
}

/* Read the field (when 'what' has OBJ_HASH_KEY set) or the value at the
 * current position of an iterator over a ziplist encoded hash. The result
 * is reported through 'vstr'/'vlen' or 'vll' as done by ziplistGet(). */
void hashTypeCurrentFromZiplist(hashTypeIterator *hi, int what,
                                unsigned char **vstr,
                                unsigned int *vlen,
                                long long *vll)
{
    unsigned char *entry;
    int ok;

    ASSERT(hi->encoding == OBJ_ENCODING_ZIPLIST);

    entry = (what & OBJ_HASH_KEY) ? hi->fptr : hi->vptr;
    ok = ziplistGet(entry, vstr, vlen, vll);
    ASSERT(ok);
}

/* Store in '*dst' the key (when 'what' has OBJ_HASH_KEY set) or the value
 * of the dictionary entry at the current position of an iterator over a
 * hash table encoded hash. */
void hashTypeCurrentFromHashTable(hashTypeIterator *hi, int what, robj **dst) {
    ASSERT(hi->encoding == OBJ_ENCODING_HT);

    *dst = (what & OBJ_HASH_KEY) ? dictGetKey(hi->de) : dictGetVal(hi->de);
}

/* Higher level version of hashTypeCurrent*() returning the field or value
 * at the iterator cursor as an object.
 *
 * Ownership depends on the encoding:
 *  - ziplist: a newly created string object is returned.
 *  - hash table: the pointer stored in the dictionary is returned as is,
 *    no copy is made.
 * NULL is returned if the encoding is unknown and serverPanic() returns. */
robj *hashTypeCurrentObject(hashTypeIterator *hi, int what) {
    /* Initialized so the unknown-encoding path never returns garbage. */
    robj *dst = NULL;

    if (hi->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *vstr = NULL;
        unsigned int vlen = UINT_MAX;
        long long vll = LLONG_MAX;

        hashTypeCurrentFromZiplist(hi, what, &vstr, &vlen, &vll);
        if (vstr) {
            dst = createStringObject((char*)vstr, vlen);
        } else {
            dst = createStringObjectFromLongLong(vll);
        }
    } else if (hi->encoding == OBJ_ENCODING_HT) {
        hashTypeCurrentFromHashTable(hi, what, &dst);
    } else {
        serverPanic("Unknown hash encoding");
    }
    return dst;
}

/* Look up 'key' for writing and return the hash stored there, creating an
 * empty hash and adding it to the database when the key does not exist.
 * When the key holds a value of another type, a wrong-type error is sent
 * to the client and NULL is returned. 'expired' is passed through to
 * lookupKeyWrite(). */
robj *hashTypeLookupWriteOrCreate(client *c, robj *key, int *expired) {
    robj *o = lookupKeyWrite(c->db,key,expired);

    if (o != NULL) {
        if (o->type == OBJ_HASH) return o;

        addReply(c,shared.wrongtypeerr);
        return NULL;
    }

    o = createHashObject();
    dbAdd(c->db,key,o);
    return o;
}

/* Convert the ziplist encoded hash 'o' to encoding 'enc'.
 * Converting to OBJ_ENCODING_ZIPLIST is a no-op. Converting to
 * OBJ_ENCODING_HT copies every pair into a new dictionary, frees the
 * ziplist and updates the object in place. */
void hashTypeConvertZiplist(robj *o, int enc) {
    hashTypeIterator *it;
    dict *table;
    int rc;

    ASSERT(o->encoding == OBJ_ENCODING_ZIPLIST);

    if (enc == OBJ_ENCODING_ZIPLIST) return; /* Nothing to do. */

    if (enc != OBJ_ENCODING_HT) {
        serverPanic("Unknown hash encoding");
        return;
    }

    it = hashTypeInitIterator(o);
    table = dictCreate(&hashDictType, NULL);

    while (hashTypeNext(it) != VR_ERROR) {
        robj *f, *v;

        f = hashTypeCurrentObject(it, OBJ_HASH_KEY);
        f = tryObjectEncoding(f);
        v = hashTypeCurrentObject(it, OBJ_HASH_VALUE);
        v = tryObjectEncoding(v);

        /* A failure here means the ziplist contained a duplicated field. */
        rc = dictAdd(table, f, v);
        ASSERT(rc == DICT_OK);
    }

    hashTypeReleaseIterator(it);
    dfree(o->ptr);

    o->encoding = OBJ_ENCODING_HT;
    o->ptr = table;
}

/* Convert the hash 'o' to encoding 'enc'. Only ziplist encoded hashes can
 * be converted; any other source encoding triggers a panic. */
void hashTypeConvert(robj *o, int enc) {
    if (o->encoding == OBJ_ENCODING_ZIPLIST) {
        hashTypeConvertZiplist(o, enc);
        return;
    }

    if (o->encoding == OBJ_ENCODING_HT) {
        serverPanic("Not implemented");
    } else {
        serverPanic("Unknown hash encoding");
    }
}

/*-----------------------------------------------------------------------------
 * Hash type commands
 *----------------------------------------------------------------------------*/

/* HSET key field value
 * Replies with 1 when a new field was created and 0 when an existing field
 * was updated. The database is write-locked for the whole operation. */
void hsetCommand(client *c) {
    robj *hash;
    int was_update;
    int expired = 0;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);

    hash = hashTypeLookupWriteOrCreate(c,c->argv[1],&expired);
    if (hash != NULL) {
        hashTypeTryConversion(hash,c->argv,2,3);
        hashTypeTryObjectEncoding(hash,&c->argv[2], &c->argv[3]);
        was_update = hashTypeSet(hash,c->argv[2],c->argv[3]);
        addReply(c, was_update ? shared.czero : shared.cone);
        signalModifiedKey(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_HASH,"hset",c->argv[1],c->db->id);
        c->vel->dirty++;
    }

    /* Common exit: release the lock, then account for a lazily expired key. */
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* HSETNX key field value
 * Sets the field only when it does not exist yet. Replies with 1 when the
 * field was set and 0 when it was already present. */
void hsetnxCommand(client *c) {
    robj *o;
    int expired = 0;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);
    if ((o = hashTypeLookupWriteOrCreate(c,c->argv[1],&expired)) == NULL) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        return;
    }
    hashTypeTryConversion(o,c->argv,2,3);

    if (hashTypeExists(o, c->argv[2])) {
        addReply(c, shared.czero);
    } else {
        hashTypeTryObjectEncoding(o,&c->argv[2], &c->argv[3]);
        hashTypeSet(o,c->argv[2],c->argv[3]);
        addReply(c, shared.cone);
        signalModifiedKey(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_HASH,"hset",c->argv[1],c->db->id);
        /* Account the change on this client's event loop, like the other
         * hash write commands do, instead of the global server counter. */
        c->vel->dirty++;
    }

    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* HMSET key field value [field value ...]
 * Sets every field/value pair and replies with OK. An odd argument count
 * (a field without a value) is rejected before touching the database. */
void hmsetCommand(client *c) {
    robj *hash;
    int pos;
    int expired = 0;

    if ((c->argc % 2) == 1) {
        addReplyError(c,"wrong number of arguments for HMSET");
        return;
    }

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);

    hash = hashTypeLookupWriteOrCreate(c,c->argv[1],&expired);
    if (hash != NULL) {
        hashTypeTryConversion(hash,c->argv,2,c->argc-1);
        pos = 2;
        while (pos < c->argc) {
            hashTypeTryObjectEncoding(hash,&c->argv[pos], &c->argv[pos+1]);
            hashTypeSet(hash,c->argv[pos],c->argv[pos+1]);
            pos += 2;
        }
        addReply(c, shared.ok);
        signalModifiedKey(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_HASH,"hset",c->argv[1],c->db->id);
        c->vel->dirty++;
    }

    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* HINCRBY key field increment
 * Adds the integer increment to the field (a missing field counts as 0)
 * and replies with the new value. Fails when the stored value is not an
 * integer or when the addition would overflow a long long. */
void hincrbyCommand(client *c) {
    long long value, incr, before;
    robj *o, *current, *new;
    int expired = 0;

    if (getLongLongFromObjectOrReply(c,c->argv[3],&incr,NULL) != VR_OK) return;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);

    o = hashTypeLookupWriteOrCreate(c,c->argv[1],&expired);
    if (o == NULL) goto end;

    current = hashTypeGetObject(o,c->argv[2]);
    if (current == NULL) {
        value = 0;
    } else {
        int parsed = getLongLongFromObjectOrReply(c,current,&value,
            "hash value is not an integer");

        /* Only the ziplist path hands back a temporary object to free. */
        if (o->encoding == OBJ_ENCODING_ZIPLIST) freeObject(current);
        if (parsed != VR_OK) goto end;
    }

    /* Detect overflow before performing the addition. */
    before = value;
    if ((incr < 0 && before < 0 && incr < (LLONG_MIN-before)) ||
        (incr > 0 && before > 0 && incr > (LLONG_MAX-before))) {
        addReplyError(c,"increment or decrement would overflow");
        goto end;
    }
    value += incr;

    new = createStringObjectFromLongLong(value);
    hashTypeTryObjectEncoding(o,&c->argv[2],NULL);
    hashTypeSet(o,c->argv[2],new);
    freeObject(new);

    addReplyLongLong(c,value);
    signalModifiedKey(c->db,c->argv[1]);
    notifyKeyspaceEvent(NOTIFY_HASH,"hincrby",c->argv[1],c->db->id);
    c->vel->dirty++;

end:
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats, expiredkeys, 1);
}

/* HINCRBYFLOAT key field increment
 * Adds the floating point increment to the field (a missing field counts
 * as 0) and replies with the new value as a bulk string. On success the
 * client's command vector is rewritten as HSET with the final value. */
void hincrbyfloatCommand(client *c) {
    long double value, incr;
    robj *o, *current, *new, *aux;
    int expired = 0;

    if (getLongDoubleFromObjectOrReply(c,c->argv[3],&incr,NULL) != VR_OK) return;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);

    o = hashTypeLookupWriteOrCreate(c,c->argv[1],&expired);
    if (o == NULL) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats, expiredkeys, 1);
        return;
    }

    current = hashTypeGetObject(o,c->argv[2]);
    if (current == NULL) {
        value = 0;
    } else {
        int parsed = getLongDoubleFromObjectOrReply(c,current,&value,
            "hash value is not a valid float");

        /* Only the ziplist path hands back a temporary object to free. */
        if (o->encoding == OBJ_ENCODING_ZIPLIST) freeObject(current);
        if (parsed != VR_OK) {
            unlockDb(c->db);
            if (expired) update_stats_add(c->vel->stats, expiredkeys, 1);
            return;
        }
    }

    value += incr;
    new = createStringObjectFromLongDouble(value,1);
    hashTypeTryObjectEncoding(o,&c->argv[2],NULL);
    hashTypeSet(o,c->argv[2],new);
    addReplyBulk(c,new);
    signalModifiedKey(c->db,c->argv[1]);
    notifyKeyspaceEvent(NOTIFY_HASH,"hincrbyfloat",c->argv[1],c->db->id);
    c->vel->dirty++;

    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats, expiredkeys, 1);

    /* Rewrite the command as HSET with the computed value, so that float
     * precision or formatting differences cannot produce a different result
     * in replicas or after an AOF restart. */
    aux = createStringObject("HSET",4);
    rewriteClientCommandArgument(c,0,aux);
    rewriteClientCommandArgument(c,3,new);
}

/* Append to the client's reply the value of 'field' in the hash 'o' as a
 * bulk string, or a null bulk when 'o' is NULL or the field is missing. */
static void addHashFieldToReply(client *c, robj *o, robj *field) {
    if (o == NULL) {
        addReply(c, shared.nullbulk);
        return;
    }

    if (o->encoding == OBJ_ENCODING_HT) {
        robj *stored;

        if (hashTypeGetFromHashTable(o, field, &stored) < 0) {
            addReply(c, shared.nullbulk);
        } else {
            addReplyBulk(c, stored);
        }
        return;
    }

    if (o->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *vstr = NULL;
        unsigned int vlen = UINT_MAX;
        long long vll = LLONG_MAX;

        if (hashTypeGetFromZiplist(o, field, &vstr, &vlen, &vll) < 0) {
            addReply(c, shared.nullbulk);
        } else if (vstr) {
            addReplyBulkCBuffer(c, vstr, vlen);
        } else {
            addReplyBulkLongLong(c, vll);
        }
        return;
    }

    serverPanic("Unknown hash encoding");
}

/* HGET key field
 * Replies with the value of the field, or a null bulk when the key or the
 * field does not exist. A missing key counts as a keyspace miss; a found
 * key counts as a hit even when it has the wrong type. */
void hgetCommand(client *c) {
    robj *hash;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    hash = lookupKeyReadOrReply(c,c->argv[1],shared.nullbulk);
    if (hash == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }

    /* checkType() replies with an error itself when the type is wrong. */
    if (!checkType(c,hash,OBJ_HASH)) {
        addHashFieldToReply(c, hash, c->argv[2]);
    }

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* HMGET key field [field ...]
 * Replies with one bulk per requested field. A missing key is treated as
 * an empty hash, so every field yields a null bulk in that case. */
void hmgetCommand(client *c) {
    robj *hash;
    int pos;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    hash = lookupKeyRead(c->db, c->argv[1]);
    if (hash != NULL && hash->type != OBJ_HASH) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        addReply(c, shared.wrongtypeerr);
        return;
    }

    addReplyMultiBulkLen(c, c->argc-2);
    pos = 2;
    while (pos < c->argc) {
        addHashFieldToReply(c, hash, c->argv[pos]);
        pos++;
    }

    unlockDb(c->db);
    if (hash == NULL) {
        update_stats_add(c->vel->stats, keyspace_misses, 1);
    } else {
        update_stats_add(c->vel->stats, keyspace_hits, 1);
    }
}

/* HDEL key field [field ...]
 * Removes the given fields and replies with the number of fields actually
 * deleted. When the hash becomes empty the key itself is removed from the
 * database and the remaining fields are not examined. */
void hdelCommand(client *c) {
    robj *o;
    int j, deleted = 0, keyremoved = 0;
    int expired = 0;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);
    if ((o = lookupKeyWriteOrReply(c,c->argv[1],shared.czero,&expired)) == NULL ||
        checkType(c,o,OBJ_HASH)) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        return;
    }

    for (j = 2; j < c->argc; j++) {
        if (hashTypeDelete(o,c->argv[j])) {
            deleted++;
            if (hashTypeLength(o) == 0) {
                dbDelete(c->db,c->argv[1]);
                keyremoved = 1;
                break;
            }
        }
    }

    /* Signal the modification while the DB is still write-locked and count
     * the change on this client's event loop, as the other hash write
     * commands in this file do. */
    if (deleted) {
        signalModifiedKey(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_HASH,"hdel",c->argv[1],c->db->id);
        if (keyremoved)
            notifyKeyspaceEvent(NOTIFY_GENERIC,"del",c->argv[1],
                                c->db->id);
        c->vel->dirty += deleted;
    }

    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);

    addReplyLongLong(c,deleted);
}

/* HLEN key
 * Replies with the number of fields in the hash, or 0 when the key does
 * not exist. */
void hlenCommand(client *c) {
    robj *hash;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    hash = lookupKeyReadOrReply(c,c->argv[1],shared.czero);
    if (hash == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }

    /* checkType() replies with an error itself when the type is wrong. */
    if (!checkType(c,hash,OBJ_HASH)) {
        addReplyLongLong(c,hashTypeLength(hash));
    }

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* HSTRLEN key field
 * Replies with the length of the value stored at the field, or 0 when the
 * key or the field does not exist. */
void hstrlenCommand(client *c) {
    robj *hash;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    hash = lookupKeyReadOrReply(c,c->argv[1],shared.czero);
    if (hash == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }

    /* checkType() replies with an error itself when the type is wrong. */
    if (!checkType(c,hash,OBJ_HASH)) {
        addReplyLongLong(c,hashTypeGetValueLength(hash,c->argv[2]));
    }

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* Append to the client's reply, as a bulk string, the field or the value
 * (selected by 'what') at the current position of the iterator. */
static void addHashIteratorCursorToReply(client *c, hashTypeIterator *hi, int what) {
    if (hi->encoding == OBJ_ENCODING_HT) {
        robj *item;

        hashTypeCurrentFromHashTable(hi, what, &item);
        addReplyBulk(c, item);
        return;
    }

    if (hi->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *vstr = NULL;
        unsigned int vlen = UINT_MAX;
        long long vll = LLONG_MAX;

        hashTypeCurrentFromZiplist(hi, what, &vstr, &vlen, &vll);
        if (vstr != NULL) {
            addReplyBulkCBuffer(c, vstr, vlen);
        } else {
            addReplyBulkLongLong(c, vll);
        }
        return;
    }

    serverPanic("Unknown hash encoding");
}

/* Shared implementation of HKEYS, HVALS and HGETALL.
 * 'flags' is a combination of OBJ_HASH_KEY and OBJ_HASH_VALUE selecting
 * what is emitted for every entry of the hash. A missing key yields an
 * empty multi bulk reply. */
void genericHgetallCommand(client *c, int flags) {
    robj *hash;
    hashTypeIterator *it;
    int per_entry = 0;
    int expected, emitted = 0;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    hash = lookupKeyReadOrReply(c,c->argv[1],shared.emptymultibulk);
    if (hash == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }
    if (checkType(c,hash,OBJ_HASH)) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        return;
    }

    /* Number of reply items produced per hash entry (1 or 2). */
    if (flags & OBJ_HASH_KEY) per_entry++;
    if (flags & OBJ_HASH_VALUE) per_entry++;

    expected = hashTypeLength(hash) * per_entry;
    addReplyMultiBulkLen(c, expected);

    it = hashTypeInitIterator(hash);
    while (hashTypeNext(it) != VR_ERROR) {
        if (flags & OBJ_HASH_KEY) {
            addHashIteratorCursorToReply(c, it, OBJ_HASH_KEY);
            emitted++;
        }
        if (flags & OBJ_HASH_VALUE) {
            addHashIteratorCursorToReply(c, it, OBJ_HASH_VALUE);
            emitted++;
        }
    }
    hashTypeReleaseIterator(it);

    /* The announced length must match what was actually sent. */
    ASSERT(emitted == expected);

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* HKEYS key: reply with the field names only. */
void hkeysCommand(client *c)
{
    genericHgetallCommand(c, OBJ_HASH_KEY);
}

/* HVALS key: reply with the values only. */
void hvalsCommand(client *c)
{
    genericHgetallCommand(c, OBJ_HASH_VALUE);
}

/* HGETALL key: reply with every field followed by its value. */
void hgetallCommand(client *c)
{
    genericHgetallCommand(c, OBJ_HASH_KEY | OBJ_HASH_VALUE);
}

/* HEXISTS key field
 * Replies with 1 when the field exists in the hash and 0 otherwise
 * (including when the key does not exist). */
void hexistsCommand(client *c) {
    robj *hash;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    hash = lookupKeyReadOrReply(c,c->argv[1],shared.czero);
    if (hash == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }

    /* checkType() replies with an error itself when the type is wrong. */
    if (!checkType(c,hash,OBJ_HASH)) {
        addReply(c, hashTypeExists(hash,c->argv[2]) ? shared.cone : shared.czero);
    }

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* HSCAN: delegates to the generic scan implementation in hash mode. */
void hscanCommand(client *c)
{
    scanGenericCommand(c, SCAN_TYPE_HASH);
}


================================================
FILE: src/vr_t_hash.h
================================================
#ifndef _VR_T_HASH_H_
#define _VR_T_HASH_H_

/* Encoding helpers: convert a ziplist hash to a hash table when arguments
 * are too long, and try to encode arguments for hash table storage. */
void hashTypeTryConversion(robj *o, robj **argv, int start, int end);
void hashTypeTryObjectEncoding(robj *subject, robj **o1, robj **o2);

/* Lookups. The two low level getters return 0 when the field is found and
 * -1 otherwise. */
int hashTypeGetFromZiplist(robj *o, robj *field, unsigned char **vstr, unsigned int *vlen, long long *vll);
int hashTypeGetFromHashTable(robj *o, robj *field, robj **value);
robj *hashTypeGetObject(robj *o, robj *field);
size_t hashTypeGetValueLength(robj *o, robj *field);
int hashTypeExists(robj *o, robj *field);

/* Modification. hashTypeSet() returns 1 on update and 0 on insert;
 * hashTypeDelete() returns 1 when the field was removed and 0 otherwise. */
int hashTypeSet(robj *o, robj *field, robj *value);
int hashTypeDelete(robj *o, robj *field);
unsigned long hashTypeLength(robj *o);

/* Iteration. hashTypeNext() returns VR_OK while entries are available and
 * VR_ERROR at the end of the hash. */
hashTypeIterator *hashTypeInitIterator(robj *subject);
void hashTypeReleaseIterator(hashTypeIterator *hi);
int hashTypeNext(hashTypeIterator *hi);
void hashTypeCurrentFromZiplist(hashTypeIterator *hi, int what, unsigned char **vstr, unsigned int *vlen, long long *vll);
void hashTypeCurrentFromHashTable(hashTypeIterator *hi, int what, robj **dst);
robj *hashTypeCurrentObject(hashTypeIterator *hi, int what);

/* Key lookup/creation and encoding conversion. */
robj *hashTypeLookupWriteOrCreate(client *c, robj *key, int *expired);
void hashTypeConvertZiplist(robj *o, int enc);
void hashTypeConvert(robj *o, int enc);

/* Command implementations. */
void hsetCommand(client *c);
void hsetnxCommand(client *c);
void hmsetCommand(client *c);
void hincrbyCommand(client *c);
void hincrbyfloatCommand(client *c);
void hgetCommand(client *c);
void hmgetCommand(client *c);
void hdelCommand(client *c);
void hlenCommand(client *c);
void hstrlenCommand(client *c);
void genericHgetallCommand(client *c, int flags);
void hkeysCommand(client *c);
void hvalsCommand(client *c);
void hgetallCommand(client *c);
void hexistsCommand(client *c);
void hscanCommand(client *c);

#endif


================================================
FILE: src/vr_t_list.c
================================================
#include <vr_core.h>

/*-----------------------------------------------------------------------------
 * List API
 *----------------------------------------------------------------------------*/

/* Push 'value' onto the list object 'subject'. 'where' == LIST_HEAD pushes
 * at the head; any other value pushes at the tail.
 *
 * The bytes handed to quicklistPush() come from the decoded form of 'value'.
 * When decoding produced a separate temporary object, that temporary is
 * freed here; the caller's 'value' is left untouched. */
void listTypePush(robj *subject, robj *value, int where) {
    int ql_where;
    robj *decoded;
    size_t nbytes;

    if (subject->encoding != OBJ_ENCODING_QUICKLIST) {
        serverPanic("Unknown list encoding");
        return;
    }

    ql_where = (where == LIST_HEAD) ? QUICKLIST_HEAD : QUICKLIST_TAIL;
    decoded = getDecodedObject(value);
    nbytes = sdslen(decoded->ptr);
    quicklistPush(subject->ptr, decoded->ptr, nbytes, ql_where);

    /* Only release the object if getDecodedObject() gave us a new one. */
    if (decoded != value) freeObject(decoded);
}

void *listPopSaver(unsigned char *data, unsigned int sz) {
    return createStringObject((char*)data,sz);
}

/* Pop one element from the head (where == LIST_HEAD) or tail (otherwise)
 * of 'subject' and return it as a string object.
 *
 * Returns NULL when quicklistPopCustom() reports that nothing was popped.
 * When the pop succeeds but the saver callback was not used to build an
 * object, the element is rebuilt from the integer the quicklist returned. */
robj *listTypePop(robj *subject, int where) {
    robj *popped = NULL;
    long long num;
    int ql_where = (where == LIST_HEAD) ? QUICKLIST_HEAD : QUICKLIST_TAIL;

    if (subject->encoding != OBJ_ENCODING_QUICKLIST) {
        serverPanic("Unknown list encoding");
        return popped;
    }

    if (quicklistPopCustom(subject->ptr, ql_where, (unsigned char **)&popped,
                           NULL, &num, listPopSaver) &&
        popped == NULL)
    {
        popped = createStringObjectFromLongLong(num);
    }
    return popped;
}

/* Return the number of elements in the list object 'subject' as reported
 * by quicklistCount(). Panics on any encoding other than quicklist. */
unsigned long listTypeLength(robj *subject) {
    if (subject->encoding != OBJ_ENCODING_QUICKLIST) {
        serverPanic("Unknown list encoding");
    } else {
        unsigned long count = quicklistCount(subject->ptr);
        return count;
    }
}

/* Allocate an iterator over 'subject' positioned at 'index'.
 *
 * 'direction' names the end the iteration moves *towards*:
 *   LIST_HEAD  -> walk from the tail side towards the head;
 *   otherwise  -> walk from the head side towards the tail.
 *
 * The returned iterator must be released with listTypeReleaseIterator(). */
listTypeIterator *listTypeInitIterator(robj *subject, long index,
                                       unsigned char direction) {
    listTypeIterator *it = dalloc(sizeof(*it));
    int ql_start;

    it->subject = subject;
    it->encoding = subject->encoding;
    it->direction = direction;
    it->iter = NULL;

    if (direction == LIST_HEAD) {
        ql_start = AL_START_TAIL;
    } else {
        ql_start = AL_START_HEAD;
    }

    if (it->encoding != OBJ_ENCODING_QUICKLIST) {
        serverPanic("Unknown list encoding");
        return it;
    }

    it->iter = quicklistGetIteratorAtIdx(it->subject->ptr, ql_start, index);
    return it;
}

/* Free an iterator obtained from listTypeInitIterator(): first the wrapped
 * quicklist iterator, then the wrapper itself. */
void listTypeReleaseIterator(listTypeIterator *li) {
    void *inner = li->iter;

    dfree(inner);
    dfree(li);
}

/* Store the entry at the iterator's current position into 'entry' and
 * advance the iterator. Returns the result of quicklistNext(): non-zero
 * when 'entry' refers to a real element, 0 when iteration is over. */
int listTypeNext(listTypeIterator *li, listTypeEntry *entry) {
    /* The list must not have changed encoding while being iterated. */
    ASSERT(li->subject->encoding == li->encoding);

    entry->li = li;

    if (li->encoding != OBJ_ENCODING_QUICKLIST) {
        serverPanic("Unknown list encoding");
        return 0;
    }
    return quicklistNext(li->iter, &entry->entry);
}

/* Build a new string object holding the element 'entry' points at.
 * The element is taken from the entry's byte buffer when it has one,
 * otherwise from its integer value. Returns NULL only if the panic on an
 * unknown encoding returns. */
robj *listTypeGet(listTypeEntry *entry) {
    if (entry->li->encoding != OBJ_ENCODING_QUICKLIST) {
        serverPanic("Unknown list encoding");
        return NULL;
    }

    if (entry->entry.value) {
        return createStringObject((char *)entry->entry.value,
                                  entry->entry.sz);
    }
    return createStringObjectFromLongLong(entry->entry.longval);
}

/* Insert 'value' next to the element referenced by 'entry':
 *   where == LIST_TAIL -> insert after the entry;
 *   where == LIST_HEAD -> insert before the entry;
 *   any other 'where'  -> nothing is inserted.
 *
 * The inserted bytes come from the decoded form of 'value'. Ownership of
 * 'value' stays with the caller: as in listTypePush(), only a temporary
 * object produced by getDecodedObject() is released here. The previous
 * unconditional decrRefCount() also dropped a reference on the caller's
 * own object whenever it was already sds-encoded. */
void listTypeInsert(listTypeEntry *entry, robj *value, int where) {
    if (entry->li->encoding == OBJ_ENCODING_QUICKLIST) {
        robj *decoded = getDecodedObject(value);
        sds str = decoded->ptr;
        size_t len = sdslen(str);

        if (where == LIST_TAIL) {
            quicklistInsertAfter((quicklist *)entry->entry.quicklist,
                                 &entry->entry, str, len);
        } else if (where == LIST_HEAD) {
            quicklistInsertBefore((quicklist *)entry->entry.quicklist,
                                  &entry->entry, str, len);
        }

        /* Free only what getDecodedObject() allocated for us. */
        if (decoded != value) freeObject(decoded);
    } else {
        serverPanic("Unknown list encoding");
    }
}

/* Compare the element 'entry' points at against the string object 'o',
 * returning whatever quicklistCompare() returns. 'o' must be sds-encoded
 * (asserted). */
int listTypeEqual(listTypeEntry *entry, robj *o) {
    if (entry->li->encoding != OBJ_ENCODING_QUICKLIST) {
        serverPanic("Unknown list encoding");
    } else {
        serverAssertWithInfo(NULL,o,sdsEncodedObject(o));
        return quicklistCompare(entry->entry.zi,o->ptr,sdslen(o->ptr));
    }
}

/* Remove the element referenced by 'entry' from the list being walked by
 * 'iter', via quicklistDelEntry(). */
void listTypeDelete(listTypeIterator *iter, listTypeEntry *entry) {
    if (entry->li->encoding != OBJ_ENCODING_QUICKLIST) {
        serverPanic("Unknown list encoding");
        return;
    }
    quicklistDelEntry(iter->iter, &entry->entry);
}

/* Convert a ziplist-encoded list object into a quicklist in place.
 * 'subject' must be an OBJ_LIST with ziplist encoding (asserted) and 'enc'
 * must be OBJ_ENCODING_QUICKLIST; any other target encoding panics. The
 * quicklist is created with the server-wide fill and compression settings. */
void listTypeConvert(robj *subject, int enc) {
    size_t fill;
    int compress;

    serverAssertWithInfo(NULL,subject,subject->type==OBJ_LIST);
    serverAssertWithInfo(NULL,subject,subject->encoding==OBJ_ENCODING_ZIPLIST);

    if (enc != OBJ_ENCODING_QUICKLIST) {
        serverPanic("Unsupported list conversion");
        return;
    }

    fill = server.list_max_ziplist_size;
    compress = server.list_compress_depth;
    subject->ptr = quicklistCreateFromZiplist(fill, compress, subject->ptr);
    subject->encoding = OBJ_ENCODING_QUICKLIST;
}

/*-----------------------------------------------------------------------------
 * List Commands
 *----------------------------------------------------------------------------*/

/* Shared body of LPUSH / RPUSH.
 *
 * Pushes argv[2..argc-1] onto the list at argv[1] (head when 'where' is
 * LIST_HEAD, tail otherwise), creating the list on the first pushed value
 * when the key does not exist. Replies with the resulting list length, or
 * with a wrong-type error when the key holds a non-list value.
 *
 * The db is write-locked from lookup to the end of the command; the
 * expired-keys statistic is updated only after the lock is released. */
void pushGenericCommand(client *c, int where) {
    robj *list;
    int idx;
    int npushed = 0;
    int expired = 0;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);

    list = lookupKeyWrite(c->db,c->argv[1],&expired);
    if (list != NULL && list->type != OBJ_LIST) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        addReply(c,shared.wrongtypeerr);
        return;
    }

    for (idx = 2; idx < c->argc; idx++) {
        c->argv[idx] = tryObjectEncoding(c->argv[idx]);

        /* Lazily create the list so that a command without values never
         * adds an empty key. */
        if (list == NULL) {
            list = createQuicklistObject();
            quicklistSetOptions(list->ptr, server.list_max_ziplist_size,
                                server.list_compress_depth);
            dbAdd(c->db,c->argv[1],list);
        }

        listTypePush(list,c->argv[idx],where);
        npushed++;
    }

    addReplyLongLong(c, list ? listTypeLength(list) : 0);

    if (npushed) {
        char *event = (where == LIST_HEAD) ? "lpush" : "rpush";

        signalModifiedKey(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_LIST,event,c->argv[1],c->db->id);
    }
    c->vel->dirty += npushed;

    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* LPUSH: generic push at the head of the list. */
void lpushCommand(client *c) {
    const int where = LIST_HEAD;

    pushGenericCommand(c, where);
}

/* RPUSH: generic push at the tail of the list. */
void rpushCommand(client *c) {
    const int where = LIST_TAIL;

    pushGenericCommand(c, where);
}

/* Shared body of LPUSHX / RPUSHX / LINSERT; operates only on an existing
 * list at argv[1].
 *
 * refval == NULL: push 'val' at the end selected by 'where'.
 * refval != NULL: scan head to tail for the first element equal to
 *                 'refval' and insert 'val' before it (LIST_HEAD) or after
 *                 it (LIST_TAIL); reply -1 when no element matches.
 *
 * On success the reply is the new list length.
 *
 * NOTE(review): unlike the other write commands in this file, this function
 * takes no db lock and bumps server.dirty rather than c->vel->dirty --
 * confirm whether that is intentional. */
void pushxGenericCommand(client *c, robj *refval, robj *val, int where) {
    robj *list;

    list = lookupKeyWriteOrReply(c,c->argv[1],shared.czero,NULL);
    if (list == NULL) return;
    if (checkType(c,list,OBJ_LIST)) return;

    if (refval == NULL) {
        char *event = (where == LIST_HEAD) ? "lpush" : "rpush";

        listTypePush(list,val,where);
        signalModifiedKey(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_LIST,event,c->argv[1],c->db->id);
        server.dirty++;
    } else {
        listTypeIterator *iter;
        listTypeEntry entry;
        int inserted = 0;

        /* Look for the pivot walking from head to tail; stop at the first
         * match. */
        iter = listTypeInitIterator(list,0,LIST_TAIL);
        while (!inserted && listTypeNext(iter,&entry)) {
            if (listTypeEqual(&entry,refval)) {
                listTypeInsert(&entry,val,where);
                inserted = 1;
            }
        }
        listTypeReleaseIterator(iter);

        if (!inserted) {
            /* Pivot not found: tell the client nothing was inserted. */
            addReply(c,shared.cnegone);
            return;
        }

        signalModifiedKey(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_LIST,"linsert",
                            c->argv[1],c->db->id);
        server.dirty++;
    }

    addReplyLongLong(c,listTypeLength(list));
}

/* LPUSHX key value: push at the head only when the list already exists. */
void lpushxCommand(client *c) {
    robj *val = tryObjectEncoding(c->argv[2]);

    c->argv[2] = val;
    pushxGenericCommand(c,NULL,val,LIST_HEAD);
}

/* RPUSHX key value: push at the tail only when the list already exists. */
void rpushxCommand(client *c) {
    robj *val = tryObjectEncoding(c->argv[2]);

    c->argv[2] = val;
    pushxGenericCommand(c,NULL,val,LIST_TAIL);
}

/* LINSERT key BEFORE|AFTER pivot value
 *
 * Parses the position keyword (case-insensitive) and forwards to
 * pushxGenericCommand() with argv[3] as the pivot. Any other keyword is
 * answered with a syntax error. */
void linsertCommand(client *c) {
    int where;

    c->argv[4] = tryObjectEncoding(c->argv[4]);

    if (strcasecmp(c->argv[2]->ptr,"after") == 0) {
        where = LIST_TAIL;
    } else if (strcasecmp(c->argv[2]->ptr,"before") == 0) {
        where = LIST_HEAD;
    } else {
        addReply(c,shared.syntaxerr);
        return;
    }

    pushxGenericCommand(c,c->argv[3],c->argv[4],where);
}

/* LLEN key: reply with the length of the list at argv[1].
 *
 * A missing key is answered with shared.czero by the lookup helper and
 * counted as a keyspace miss; a wrong-type key and the normal path are
 * counted as keyspace hits. The db is read-locked during the lookup. */
void llenCommand(client *c) {
    robj *list;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    list = lookupKeyReadOrReply(c,c->argv[1],shared.czero);
    if (list == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }

    if (checkType(c,list,OBJ_LIST)) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        return;
    }

    addReplyLongLong(c,listTypeLength(list));

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* LINDEX key index: reply with the element at 'index', or a null bulk when
 * quicklistIndex() finds no element there.
 *
 * The index is parsed before any lock is taken. The element is copied into
 * a temporary string object for the reply and freed right after. */
void lindexCommand(client *c) {
    robj *list;
    long index;

    if (getLongFromObjectOrReply(c, c->argv[2], &index, NULL) != VR_OK)
        return;

    fetchInternalDbByKey(c,c->argv[1]);
    lockDbRead(c->db);

    list = lookupKeyReadOrReply(c,c->argv[1],shared.nullbulk);
    if (list == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }

    if (checkType(c,list,OBJ_LIST)) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        return;
    }

    if (list->encoding != OBJ_ENCODING_QUICKLIST) {
        serverPanic("Unknown list encoding");
    } else {
        quicklistEntry qe;

        if (!quicklistIndex(list->ptr, index, &qe)) {
            addReply(c,shared.nullbulk);
        } else {
            robj *element;

            if (qe.value) {
                element = createStringObject((char*)qe.value,qe.sz);
            } else {
                element = createStringObjectFromLongLong(qe.longval);
            }
            addReplyBulk(c,element);
            freeObject(element);
        }
    }

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* LSET key index value: overwrite the element at 'index' with argv[3].
 *
 * Replies OK on success and an out-of-range error when
 * quicklistReplaceAtIndex() reports that nothing was replaced. A missing
 * key is answered with shared.nokeyerr by the lookup helper. The db is
 * write-locked for the whole operation; the expired-keys statistic is
 * updated after unlocking. */
void lsetCommand(client *c) {
    robj *list;
    robj *newval = c->argv[3];
    long index;
    int expired = 0;

    if (getLongFromObjectOrReply(c, c->argv[2], &index, NULL) != VR_OK)
        return;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);

    list = lookupKeyWriteOrReply(c,c->argv[1],shared.nokeyerr,&expired);
    if (list == NULL || checkType(c,list,OBJ_LIST)) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        return;
    }

    if (list->encoding != OBJ_ENCODING_QUICKLIST) {
        serverPanic("Unknown list encoding");
    } else {
        quicklist *ql = list->ptr;

        if (quicklistReplaceAtIndex(ql, index,
                                    newval->ptr, sdslen(newval->ptr))) {
            addReply(c,shared.ok);
            signalModifiedKey(c->db,c->argv[1]);
            notifyKeyspaceEvent(NOTIFY_LIST,"lset",c->argv[1],c->db->id);
            c->vel->dirty++;
        } else {
            addReply(c,shared.outofrangeerr);
        }
    }

    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* Shared body of LPOP / RPOP.
 *
 * Pops one element from the head (LIST_HEAD) or tail of the list at
 * argv[1] and replies with it, or with a null bulk when the key is missing
 * or nothing could be popped. When the pop leaves the list empty the key is
 * deleted and a "del" event is emitted in addition to the pop event.
 * The db is write-locked for the whole operation. */
void popGenericCommand(client *c, int where) {
    robj *list, *popped;
    int expired = 0;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);

    list = lookupKeyWriteOrReply(c,c->argv[1],shared.nullbulk,&expired);
    if (list == NULL || checkType(c,list,OBJ_LIST)) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        return;
    }

    popped = listTypePop(list,where);
    if (popped != NULL) {
        char *event = (where == LIST_HEAD) ? "lpop" : "rpop";

        addReplyBulk(c,popped);
        freeObject(popped);
        notifyKeyspaceEvent(NOTIFY_LIST,event,c->argv[1],c->db->id);

        /* An empty list is never kept in the keyspace. */
        if (listTypeLength(list) == 0) {
            notifyKeyspaceEvent(NOTIFY_GENERIC,"del",
                                c->argv[1],c->db->id);
            dbDelete(c->db,c->argv[1]);
        }
        signalModifiedKey(c->db,c->argv[1]);
        c->vel->dirty++;
    } else {
        addReply(c,shared.nullbulk);
    }

    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* LPOP: generic pop from the head of the list. */
void lpopCommand(client *c) {
    const int where = LIST_HEAD;

    popGenericCommand(c, where);
}

/* RPOP: generic pop from the tail of the list. */
void rpopCommand(client *c) {
    const int where = LIST_TAIL;

    popGenericCommand(c, where);
}

/* LRANGE key start stop
 *
 * Replies with the elements between 'start' and 'stop' inclusive. Negative
 * indexes count from the end of the list; out-of-range indexes are clamped
 * and an empty range yields an empty multi-bulk reply. Both indexes are
 * parsed before the db is read-locked. */
void lrangeCommand(client *c) {
    robj *list;
    long start, end, llen, rangelen, remaining;

    if (getLongFromObjectOrReply(c, c->argv[2], &start, NULL) != VR_OK) return;
    if (getLongFromObjectOrReply(c, c->argv[3], &end, NULL) != VR_OK) return;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    list = lookupKeyReadOrReply(c,c->argv[1],shared.emptymultibulk);
    if (list == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }
    if (checkType(c,list,OBJ_LIST)) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        return;
    }

    llen = listTypeLength(list);

    /* Translate negative indexes into offsets from the head. */
    if (start < 0) start += llen;
    if (end < 0) end += llen;
    if (start < 0) start = 0;

    /* start is now >= 0, so a still-negative end also lands here.
     * Nothing to return when start is past end or past the list. */
    if (start > end || start >= llen) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        addReply(c,shared.emptymultibulk);
        return;
    }
    if (end >= llen) end = llen-1;
    rangelen = (end-start)+1;

    /* Emit the multi-bulk header followed by one bulk per element. */
    addReplyMultiBulkLen(c,rangelen);
    if (list->encoding != OBJ_ENCODING_QUICKLIST) {
        serverPanic("List encoding is not QUICKLIST!");
    } else {
        listTypeIterator *iter = listTypeInitIterator(list, start, LIST_TAIL);

        for (remaining = rangelen; remaining > 0; remaining--) {
            listTypeEntry entry;
            quicklistEntry *qe;

            listTypeNext(iter, &entry);
            qe = &entry.entry;
            if (qe->value) {
                addReplyBulkCBuffer(c,qe->value,qe->sz);
            } else {
                addReplyBulkLongLong(c,qe->longval);
            }
        }
        listTypeReleaseIterator(iter);
    }

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* LTRIM key start stop
 *
 * Keeps only the elements between 'start' and 'stop' inclusive, removing
 * everything else. Negative indexes count from the end of the list. An
 * empty or out-of-range selection removes every element, after which the
 * key itself is deleted. Always replies OK once the key is known to be a
 * list (a missing key is answered with OK by the lookup helper). */
void ltrimCommand(client *c) {
    robj *list;
    long start, end, llen, ltrim, rtrim;
    int expired = 0;

    if (getLongFromObjectOrReply(c, c->argv[2], &start, NULL) != VR_OK) return;
    if (getLongFromObjectOrReply(c, c->argv[3], &end, NULL) != VR_OK) return;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);

    list = lookupKeyWriteOrReply(c,c->argv[1],shared.ok,&expired);
    if (list == NULL || checkType(c,list,OBJ_LIST)) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats, expiredkeys, 1);
        return;
    }
    llen = listTypeLength(list);

    /* Translate negative indexes into offsets from the head. */
    if (start < 0) start += llen;
    if (end < 0) end += llen;
    if (start < 0) start = 0;

    /* Default: the selection is empty, so the whole list is cut from the
     * left. Override when the range actually selects something. */
    ltrim = llen;
    rtrim = 0;
    if (start <= end && start < llen) {
        if (end >= llen) end = llen-1;
        ltrim = start;
        rtrim = llen-end-1;
    }

    /* Drop 'ltrim' elements from the head, then 'rtrim' from the tail. */
    if (list->encoding != OBJ_ENCODING_QUICKLIST) {
        serverPanic("Unknown list encoding");
    } else {
        quicklistDelRange(list->ptr,0,ltrim);
        quicklistDelRange(list->ptr,-rtrim,rtrim);
    }

    notifyKeyspaceEvent(NOTIFY_LIST,"ltrim",c->argv[1],c->db->id);
    if (listTypeLength(list) == 0) {
        dbDelete(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_GENERIC,"del",c->argv[1],c->db->id);
    }
    signalModifiedKey(c->db,c->argv[1]);
    c->vel->dirty++;
    addReply(c,shared.ok);

    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats, expiredkeys, 1);
}

/* LREM key count value
 *
 * Removes elements equal to argv[3] from the list at argv[1]:
 *   count > 0: remove up to 'count' matches scanning head to tail;
 *   count < 0: remove up to |count| matches scanning tail to head;
 *   count = 0: remove every match.
 * Replies with the number of removed elements. When the list ends up empty
 * the key is deleted and a "del" event is emitted.
 *
 * The "lrem" event is published in the NOTIFY_LIST class, like every other
 * list event in this file (it was previously sent as NOTIFY_GENERIC, so
 * clients subscribed only to list events never received it).
 *
 * The count is parsed before the db is write-locked; the expired-keys
 * statistic is updated after unlocking. */
void lremCommand(client *c) {
    robj *subject, *obj;
    obj = c->argv[3];
    long toremove;
    long removed = 0;
    int expired = 0;

    if ((getLongFromObjectOrReply(c, c->argv[2], &toremove, NULL) != VR_OK))
        return;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);
    subject = lookupKeyWriteOrReply(c,c->argv[1],shared.czero,&expired);
    if (subject == NULL || checkType(c,subject,OBJ_LIST)) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats, expiredkeys, 1);
        return;
    }

    /* A negative count means "scan from the tail". */
    listTypeIterator *li;
    if (toremove < 0) {
        toremove = -toremove;
        li = listTypeInitIterator(subject,-1,LIST_HEAD);
    } else {
        li = listTypeInitIterator(subject,0,LIST_TAIL);
    }

    listTypeEntry entry;
    while (listTypeNext(li,&entry)) {
        if (listTypeEqual(&entry,obj)) {
            listTypeDelete(li, &entry);
            c->vel->dirty++;
            removed++;
            /* toremove == 0 means no limit. */
            if (toremove && removed == toremove) break;
        }
    }
    listTypeReleaseIterator(li);

    if (removed) {
        signalModifiedKey(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_LIST,"lrem",c->argv[1],c->db->id);
    }

    /* An empty list is never kept in the keyspace. */
    if (listTypeLength(subject) == 0) {
        dbDelete(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_GENERIC,"del",c->argv[1],c->db->id);
    }

    addReplyLongLong(c,removed);
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats, expiredkeys, 1);
}

/* This is the semantic of this command:
 *  RPOPLPUSH srclist dstlist:
 *    IF LLEN(srclist) > 0
 *      element = RPOP srclist
 *      LPUSH dstlist element
 *      RETURN element
 *    ELSE
 *      RETURN nil
 *    END
 *  END
 *
 * The idea is to be able to get an element from a list in a reliable way
 * since the element is not just returned but pushed against another list
 * as well. This command was originally proposed by Ezra Zygmuntowicz.
 */

/* Push half of RPOPLPUSH / BRPOPLPUSH.
 *
 * Pushes 'value' at the head of the list 'dstobj' stored at 'dstkey',
 * creating and registering a new quicklist first when 'dstobj' is NULL.
 * Emits the "lpush" event and sends 'value' to the client as a bulk reply. */
void rpoplpushHandlePush(client *c, robj *dstkey, robj *dstobj, robj *value) {
    if (dstobj == NULL) {
        /* Destination key does not exist yet: create an empty list. */
        dstobj = createQuicklistObject();
        quicklistSetOptions(dstobj->ptr, server.list_max_ziplist_size,
                            server.list_compress_depth);
        dbAdd(c->db,dstkey,dstobj);
    }

    signalModifiedKey(c->db,dstkey);
    listTypePush(dstobj,value,LIST_HEAD);
    notifyKeyspaceEvent(NOTIFY_LIST,"lpush",dstkey,c->db->id);

    /* The moved element is always what the client gets back. */
    addReplyBulk(c,value);
}

/* RPOPLPUSH source destination
 *
 * Pops the tail element of the list at argv[1] and pushes it at the head
 * of the list at argv[2], replying with the moved element. Replies with a
 * null bulk when the source is missing or empty, and with a type error when
 * either key holds a non-list value. The source key is deleted when the pop
 * leaves it empty.
 *
 * NOTE(review): unlike the other write commands in this file, this function
 * takes no db lock and bumps server.dirty rather than c->vel->dirty --
 * confirm whether that is intentional. */
void rpoplpushCommand(client *c) {
    robj *src, *dst, *popped, *srckey;

    src = lookupKeyWriteOrReply(c,c->argv[1],shared.nullbulk,NULL);
    if (src == NULL || checkType(c,src,OBJ_LIST)) return;

    if (listTypeLength(src) == 0) {
        /* This may only happen after loading very old RDB files. Recent
         * versions of Redis delete keys of empty lists. */
        addReply(c,shared.nullbulk);
        return;
    }

    dst = lookupKeyWrite(c->db,c->argv[2],NULL);
    srckey = c->argv[1];

    if (dst && checkType(c,dst,OBJ_LIST)) return;
    popped = listTypePop(src,LIST_TAIL);

    /* Keep our own reference to the source key: rpoplpushHandlePush() may
     * change the client argument vector (it does not currently). */
    incrRefCount(srckey);
    rpoplpushHandlePush(c,c->argv[2],dst,popped);

    /* Drop the reference on the popped element now that it was pushed. */
    decrRefCount(popped);

    notifyKeyspaceEvent(NOTIFY_LIST,"rpop",srckey,c->db->id);
    if (listTypeLength(src) == 0) {
        /* The source list is now empty: remove the key. */
        dbDelete(c->db,srckey);
        notifyKeyspaceEvent(NOTIFY_GENERIC,"del",
                            srckey,c->db->id);
    }
    signalModifiedKey(c->db,srckey);
    decrRefCount(srckey);
    server.dirty++;
}

/*-----------------------------------------------------------------------------
 * Blocking POP operations
 *----------------------------------------------------------------------------*/

/* This is how the current blocking POP works, we use BLPOP as example:
 * - If the user calls BLPOP and the key exists and contains a non empty list
 *   then LPOP is called instead. So BLPOP is semantically the same as LPOP
 *   if blocking is not required.
 * - If instead BLPOP is called and the key does not exist or the list is
 *   empty we need to block. In order to do so we remove the notification for
 *   new data to read in the client socket (so that we'll not serve new
 *   requests if the blocking request is not served). Also we put the client
 *   in a dictionary (db->blocking_keys) mapping keys to a list of clients
 *   blocked on those keys.
 * - If a PUSH operation against a key with blocked clients waiting is
 *   performed, we mark this key as "ready", and after the current command,
 *   MULTI/EXEC block, or script, is executed, we serve all the clients waiting
 *   for this list, from the one that blocked first, to the last, accordingly
 *   to the number of elements we have in the ready list.
 */

/* Put client 'c' in blocking mode on the given keys.
 *
 * Records 'timeout' and 'target' (retained when not NULL) in c->bpop, then
 * for every key not already present in c->bpop.keys registers the client
 * in both directions: the key is added to c->bpop.keys, and the client is
 * appended to the per-key waiter list in c->db->blocking_keys (created on
 * first use). Finally the client is marked blocked with BLOCKED_LIST. */
void blockForKeys(client *c, robj **keys, int numkeys, mstime_t timeout, robj *target) {
    int j;

    c->bpop.timeout = timeout;
    c->bpop.target = target;

    if (target != NULL) incrRefCount(target);

    for (j = 0; j < numkeys; j++) {
        robj *key = keys[j];
        dictEntry *de;
        dlist *waiters;

        /* Skip keys this client is already waiting on. */
        if (dictAdd(c->bpop.keys,key,NULL) != DICT_OK) continue;
        incrRefCount(key);

        /* Reverse mapping: key -> list of clients blocked on it. */
        de = dictFind(c->db->blocking_keys,key);
        if (de != NULL) {
            waiters = dictGetVal(de);
        } else {
            int retval;

            /* First waiter for this key: create its client list. */
            waiters = dlistCreate();
            retval = dictAdd(c->db->blocking_keys,key,waiters);
            incrRefCount(key);
            serverAssertWithInfo(c,key,retval == DICT_OK);
        }
        dlistAddNodeTail(waiters,c);
    }
    blockClient(c,BLOCKED_LIST);
}

/* Undo the bookkeeping done by blockForKeys() for a client blocked in an
 * operation such as BLPOP. Never call this directly; go through
 * unblockClient() instead.
 *
 * The client is removed from the waiter list of every key it was blocked
 * on (dropping lists that become empty), its own key set is emptied and
 * the reference on bpop.target, if any, is released. */
void unblockClientWaitingData(client *c) {
    dictIterator *it;
    dictEntry *entry;

    serverAssertWithInfo(c,NULL,dictSize(c->bpop.keys) != 0);

    /* A client may be waiting on several keys: detach it from each one. */
    it = dictGetIterator(c->bpop.keys);
    for (entry = dictNext(it); entry != NULL; entry = dictNext(it)) {
        robj *key = dictGetKey(entry);
        dlist *waiters = dictFetchValue(c->db->blocking_keys,key);
        dlistNode *self;

        serverAssertWithInfo(c,key,waiters != NULL);

        self = dlistSearchKey(waiters,c);
        dlistDelNode(waiters,self);

        /* Do not keep empty waiter lists around. */
        if (dlistLength(waiters) == 0)
            dictDelete(c->db->blocking_keys,key);
    }
    dictReleaseIterator(it);

    /* Reset the blocking state stored in the client itself. */
    dictEmpty(c->bpop.keys,NULL);
    if (c->bpop.target) {
        decrRefCount(c->bpop.target);
        c->bpop.target = NULL;
    }
}

/* Queue 'key' for processing by handleClientsBlockedOnLists() when at
 * least one client is blocked on it.
 *
 * Nothing is done when no client is blocked on the key, or when the key is
 * already recorded in db->ready_keys. That dictionary exists precisely so
 * that repeated pushes to the same key (e.g. from a script or inside
 * MULTI/EXEC) enqueue it in server.ready_keys only once. */
void signalListAsReady(redisDb *db, robj *key) {
    int ret;
    readyList *ready;

    /* Nobody waiting, or already signaled: nothing to queue. */
    if (dictFind(db->blocking_keys,key) == NULL ||
        dictFind(db->ready_keys,key) != NULL)
    {
        return;
    }

    /* Append a (db, key) record to the global ready list. */
    ready = dalloc(sizeof(*ready));
    ready->key = key;
    ready->db = db;
    incrRefCount(key);
    dlistAddNodeTail(server.ready_keys,ready);

    /* Remember the key in the per-db dictionary too, so the "already
     * signaled" test above stays an O(1) lookup. */
    incrRefCount(key);
    ret = dictAdd(db->ready_keys,key,NULL);
    ASSERT(ret == DICT_OK);
}

/* Helper for handleClientsBlockedOnLists(). Its job is to serve one client
 * ('receiver') blocked on 'key' in database 'db' with the already popped
 * element 'value':
 *
 * 1) dstkey == NULL (BLPOP / BRPOP): reply with the [key, value] pair.
 * 2) dstkey != NULL (BRPOPLPUSH): also push 'value' at the head of the
 *    destination list.
 * 3) In both cases propagate the equivalent non-blocking commands (LPOP or
 *    RPOP, plus LPUSH for BRPOPLPUSH) to the AOF and replication channel.
 *
 * 'where' is LIST_HEAD or LIST_TAIL and tells from which end 'value' was
 * popped, so the right pop command is propagated.
 *
 * Returns VR_OK when the client was served. Returns VR_ERROR only for a
 * BRPOPLPUSH whose destination key holds a non-list value; the caller is
 * then expected to undo the pop. */
int serveClientBlockedOnList(client *receiver, robj *key, robj *dstkey, redisDb *db, robj *value, int where)
{
    robj *argv[3];
    robj *dstobj;

    if (dstkey == NULL) {
        /* BLPOP / BRPOP: propagate as the matching plain pop. */
        argv[1] = key;
        if (where == LIST_HEAD) {
            argv[0] = shared.lpop;
            propagate(server.lpopCommand,
                db->id,argv,2,PROPAGATE_AOF|PROPAGATE_REPL);
        } else {
            argv[0] = shared.rpop;
            propagate(server.rpopCommand,
                db->id,argv,2,PROPAGATE_AOF|PROPAGATE_REPL);
        }

        addReplyMultiBulkLen(receiver,2);
        addReplyBulk(receiver,key);
        addReplyBulk(receiver,value);
        return VR_OK;
    }

    /* BRPOPLPUSH */
    dstobj = lookupKeyWrite(receiver->db,dstkey,NULL);
    if (dstobj && checkType(receiver,dstobj,OBJ_LIST)) {
        /* Destination exists but is not a list: the push cannot happen. */
        return VR_ERROR;
    }

    /* Propagate the RPOP operation. */
    argv[0] = shared.rpop;
    argv[1] = key;
    propagate(server.rpopCommand,
        db->id,argv,2,PROPAGATE_AOF|PROPAGATE_REPL);

    rpoplpushHandlePush(receiver,dstkey,dstobj,value);

    /* Propagate the LPUSH operation. */
    argv[0] = shared.lpush;
    argv[1] = dstkey;
    argv[2] = value;
    propagate(server.lpushCommand,
        db->id,argv,3,PROPAGATE_AOF|PROPAGATE_REPL);

    return VR_OK;
}

/* This function should be called by Redis every time a single command,
 * a MULTI/EXEC block, or a Lua script, terminated its execution after
 * being called by a client.
 *
 * All the keys with at least one client blocked that received at least
 * one new element via some PUSH operation are accumulated into
 * the server.ready_keys list. This function will run the list and will
 * serve clients accordingly. Note that the function will iterate again and
 * again as a result of serving BRPOPLPUSH we can have new blocking clients
 * to serve because of the PUSH side of BRPOPLPUSH.
 *
 * The function takes no arguments and returns nothing: it works on
 * server.ready_keys and on the per-db ready_keys / blocking_keys
 * dictionaries, and returns once server.ready_keys is empty. */
void handleClientsBlockedOnLists(void) {
    while(dlistLength(server.ready_keys) != 0) {
        dlist *l;

        /* Point server.ready_keys to a fresh list and save the current one
         * locally. This way as we run the old list we are free to call
         * signalListAsReady() that may push new elements in server.ready_keys
         * when handling clients blocked into BRPOPLPUSH. */
        l = server.ready_keys;
        server.ready_keys = dlistCreate();

        /* Consume the saved list from its head, one ready key at a time. */
        while(dlistLength(l) != 0) {
            dlistNode *ln = dlistFirst(l);
            readyList *rl = ln->value;

            /* First of all remove this key from db->ready_keys so that
             * we can safely call signalListAsReady() against this key. */
            dictDelete(rl->db->ready_keys,rl->key);

            /* If the key exists and it's a list, serve blocked clients
             * with data. */
            robj *o = lookupKeyWrite(rl->db,rl->key,NULL);
            if (o != NULL && o->type == OBJ_LIST) {
                dictEntry *de;

                /* We serve clients in the same order they blocked for
                 * this key, from the first blocked to the last. */
                de = dictFind(rl->db->blocking_keys,rl->key);
                if (de) {
                    dlist *clients = dictGetVal(de);
                    /* The number of waiters is sampled once, so at most
                     * this many clients are served for the key in this
                     * pass. */
                    int numclients = dlistLength(clients);

                    while(numclients--) {
                        dlistNode *clientnode = dlistFirst(clients);
                        client *receiver = clientnode->value;
                        robj *dstkey = receiver->bpop.target;
                        /* Pop from the head only when the last command run
                         * by the client was BLPOP, from the tail in every
                         * other case. */
                        int where = (receiver->lastcmd &&
                                     receiver->lastcmd->proc == blpopCommand) ?
                                    LIST_HEAD : LIST_TAIL;
                        robj *value = listTypePop(o,where);

                        if (value) {
                            /* Protect receiver->bpop.target, that will be
                             * freed by the next unblockClient()
                             * call. */
                            if (dstkey) incrRefCount(dstkey);
                            unblockClient(receiver);

                            if (serveClientBlockedOnList(receiver,
                                rl->key,dstkey,rl->db,value,
                                where) == VR_ERROR)
                            {
                                /* If we failed serving the client we need
                                 * to also undo the POP operation. */
                                    listTypePush(o,value,where);
                            }

                            /* Drop the protection taken above and our use
                             * of the popped value. */
                            if (dstkey) decrRefCount(dstkey);
                            decrRefCount(value);
                        } else {
                            /* Nothing left to pop: stop serving clients
                             * for this key. */
                            break;
                        }
                    }
                }

                /* A list emptied by the pops above is removed from the
                 * database. */
                if (listTypeLength(o) == 0) {
                    dbDelete(rl->db,rl->key);
                }
                /* We don't call signalModifiedKey() as it was already called
                 * when an element was pushed on the list. */
            }

            /* Free this item. */
            decrRefCount(rl->key);
            dfree(rl);
            dlistDelNode(l,ln);
        }
        dlistRelease(l); /* We have the new list on place at this point. */
    }
}

/* Shared body of the blocking pop commands.
 *
 * 'where' selects the end of the list to pop from (LIST_HEAD or LIST_TAIL).
 * The last argument of the command is the timeout; every argument between
 * the command name and the timeout is a key.
 *
 * Keys are scanned in order: the first one holding a non empty list is
 * served right away, and a key holding a non list value aborts the command
 * with a wrong type error. When no key can be served the client either
 * receives a null multi bulk reply (inside MULTI) or blocks on all the
 * keys. */
void blockingPopGenericCommand(client *c, int where) {
    mstime_t timeout;
    int idx;

    if (getTimeoutFromObjectOrReply(c,c->argv[c->argc-1],&timeout,
                                    UNIT_SECONDS) != VR_OK)
    {
        return;
    }

    for (idx = 1; idx < c->argc-1; idx++) {
        robj *list = lookupKeyWrite(c->db,c->argv[idx],NULL);

        /* Missing keys are simply skipped. */
        if (list == NULL) continue;

        if (list->type != OBJ_LIST) {
            addReply(c,shared.wrongtypeerr);
            return;
        }

        /* An existing but empty list cannot serve the client either. */
        if (listTypeLength(list) == 0) continue;

        /* Non empty list: from here on this is a plain [LR]POP. */
        robj *value = listTypePop(list,where);
        ASSERT(value != NULL);

        addReplyMultiBulkLen(c,2);
        addReplyBulk(c,c->argv[idx]);
        addReplyBulk(c,value);
        decrRefCount(value);
        notifyKeyspaceEvent(NOTIFY_LIST,
                            (where == LIST_HEAD) ? "lpop" : "rpop",
                            c->argv[idx],c->db->id);

        /* The pop may have consumed the last element of the list. */
        if (listTypeLength(list) == 0) {
            dbDelete(c->db,c->argv[idx]);
            notifyKeyspaceEvent(NOTIFY_GENERIC,"del",
                                c->argv[idx],c->db->id);
        }
        signalModifiedKey(c->db,c->argv[idx]);
        server.dirty++;

        /* Replicate it as an [LR]POP instead of B[LR]POP. */
        rewriteClientCommandVector(c,2,
            (where == LIST_HEAD) ? shared.lpop : shared.rpop,
            c->argv[idx]);
        return;
    }

    /* Inside a MULTI/EXEC blocking is not possible: an empty list is
     * handled exactly like a timeout (even with timeout 0). */
    if (c->flags & CLIENT_MULTI) {
        addReply(c,shared.nullmultibulk);
        return;
    }

    /* No key could be served: block on all of them. */
    blockForKeys(c, c->argv + 1, c->argc - 2, timeout, NULL);
}

/* BLPOP: blocking pop performed on the head of the list. */
void blpopCommand(client *c) {
    const int where = LIST_HEAD;

    blockingPopGenericCommand(c,where);
}

/* BRPOP: blocking pop performed on the tail of the list. */
void brpopCommand(client *c) {
    const int where = LIST_TAIL;

    blockingPopGenericCommand(c,where);
}

/* BRPOPLPUSH: argv[1] is the source key, argv[2] the destination key and
 * argv[3] the timeout.
 *
 * When the source key holds a list the regular rpoplpushCommand() is run.
 * When the source key is missing the client blocks on it, unless the command
 * is executed inside a MULTI, where a null bulk is returned immediately. */
void brpoplpushCommand(client *c) {
    mstime_t timeout;
    robj *key;

    if (getTimeoutFromObjectOrReply(c,c->argv[3],&timeout,UNIT_SECONDS)
        != VR_OK)
    {
        return;
    }

    key = lookupKeyWrite(c->db, c->argv[1],NULL);

    if (key != NULL) {
        if (key->type != OBJ_LIST) {
            addReply(c, shared.wrongtypeerr);
            return;
        }

        /* The list exists and is expected to hold elements, so the
         * non blocking implementation can serve the request. */
        serverAssertWithInfo(c,key,listTypeLength(key) > 0);
        rpoplpushCommand(c);
        return;
    }

    /* From here on the source key does not exist. */
    if (c->flags & CLIENT_MULTI) {
        /* Blocking is not possible in a multi state: reply at once. */
        addReply(c, shared.nullbulk);
        return;
    }

    /* Wait for the source key, remembering the destination as target. */
    blockForKeys(c, c->argv + 1, 1, timeout, c->argv[2]);
}


================================================
FILE: src/vr_t_list.h
================================================
/* Prototypes for the list type helpers, the list command handlers and the
 * functions used to serve clients blocked on lists. */
#ifndef _VR_T_LIST_H_
#define _VR_T_LIST_H_

/* Helpers operating on a list object, on its iterator or on an entry. */
void listTypePush(robj *subject, robj *value, int where);
void *listPopSaver(unsigned char *data, unsigned int sz);
robj *listTypePop(robj *subject, int where);
unsigned long listTypeLength(robj *subject);
listTypeIterator *listTypeInitIterator(robj *subject, long index, unsigned char direction);
void listTypeReleaseIterator(listTypeIterator *li);
int listTypeNext(listTypeIterator *li, listTypeEntry *entry);
robj *listTypeGet(listTypeEntry *entry);
void listTypeInsert(listTypeEntry *entry, robj *value, int where);
int listTypeEqual(listTypeEntry *entry, robj *o);
void listTypeDelete(listTypeIterator *iter, listTypeEntry *entry);
void listTypeConvert(robj *subject, int enc);

/* Command handlers and their shared generic implementations. */
void pushGenericCommand(client *c, int where);
void lpushCommand(client *c);
void rpushCommand(client *c);
void pushxGenericCommand(client *c, robj *refval, robj *val, int where);
void lpushxCommand(client *c);
void rpushxCommand(client *c);
void linsertCommand(client *c);
void llenCommand(client *c);
void lindexCommand(client *c);
void lsetCommand(client *c);
void popGenericCommand(client *c, int where);
void lpopCommand(client *c);
void rpopCommand(client *c);
void lrangeCommand(client *c);
void ltrimCommand(client *c);
void lremCommand(client *c);
void rpoplpushHandlePush(client *c, robj *dstkey, robj *dstobj, robj *value);
void rpoplpushCommand(client *c);

/* Blocking operations: blocking a client on keys, signaling keys as ready
 * and serving the blocked clients. */
void blockForKeys(client *c, robj **keys, int numkeys, mstime_t timeout, robj *target);
void unblockClientWaitingData(client *c);
void signalListAsReady(redisDb *db, robj *key);
/* Returns VR_OK, or VR_ERROR when the client could not be served. */
int serveClientBlockedOnList(client *receiver, robj *key, robj *dstkey, redisDb *db, robj *value, int where);
void handleClientsBlockedOnLists(void);
void blockingPopGenericCommand(client *c, int where);
void blpopCommand(client *c);
void brpopCommand(client *c);
void brpoplpushCommand(client *c);

#endif


================================================
FILE: src/vr_t_set.c
================================================
#include <vr_core.h>

/*-----------------------------------------------------------------------------
 * Set Commands
 *----------------------------------------------------------------------------*/

/* Prototype declared up front; the definition is not in this part of the
 * file. */
void sunionDiffGenericCommand(client *c, robj **setkeys, int setnum,
                              robj *dstkey, int op);

/* Build an empty set object suitable to store "value": an intset backed
 * object when the value can be represented as a long long, a regular set
 * object otherwise. */
robj *setTypeCreate(robj *value) {
    int integer_like =
        (isObjectRepresentableAsLongLong(value,NULL) == VR_OK);

    return integer_like ? createIntsetObject() : createSetObject();
}

/* Add the specified value into a set. The set stores its own copy of the
 * value (made with dupStringObjectUnconstant()), so the caller keeps
 * ownership of 'value'.
 *
 * If the value was already member of the set, nothing is done and 0 is
 * returned, otherwise the new element is added and 1 is returned.
 *
 * An intset encoded set is converted to a hash table either when the value
 * is not representable as an integer, or when the intset grows beyond
 * server.set_max_intset_entries. */
int setTypeAdd(robj *subject, robj *value) {
    long long llval;
    robj *obj;
    int retval;

    if (subject->encoding == OBJ_ENCODING_HT) {
        obj = dupStringObjectUnconstant(value);
        if (dictAdd(subject->ptr,obj,NULL) == DICT_OK) {
            return 1;
        } else {
            /* Already a member: release the copy we just made. */
            freeObject(obj);
        }
    } else if (subject->encoding == OBJ_ENCODING_INTSET) {
        if (isObjectRepresentableAsLongLong(value,&llval) == VR_OK) {
            uint8_t success = 0;
            subject->ptr = intsetAdd(subject->ptr,llval,&success);
            if (success) {
                /* Convert to regular set when the intset contains
                 * too many entries. */
                if (intsetLen(subject->ptr) > server.set_max_intset_entries)
                    setTypeConvert(subject,OBJ_ENCODING_HT);
                return 1;
            }
        } else {
            /* Failed to get integer from object, convert to regular set. */
            setTypeConvert(subject,OBJ_ENCODING_HT);
            obj = dupStringObjectUnconstant(value);
            /* The set *was* an intset and this value is not integer
             * encodable, so dictAdd should always work. The insertion is
             * performed outside of the assertion so that it never depends
             * on how the assertion macro evaluates its argument. */
            retval = dictAdd(subject->ptr,obj,NULL);
            serverAssertWithInfo(NULL,obj,retval == DICT_OK);
            return 1;
        }
    } else {
        serverPanic("Unknown set encoding");
    }
    return 0;
}

/* Remove 'value' from the set. Returns 1 when the element was found and
 * removed, 0 when it was not a member of the set. */
int setTypeRemove(robj *setobj, robj *value) {
    if (setobj->encoding == OBJ_ENCODING_HT) {
        if (dictDelete(setobj->ptr,value) != DICT_OK) return 0;

        /* Give the hash table a chance to shrink after the removal. */
        if (htNeedsResize(setobj->ptr)) dictResize(setobj->ptr);
        return 1;
    }

    if (setobj->encoding == OBJ_ENCODING_INTSET) {
        long long llval;
        int success;

        /* A value that is not an integer is never stored in an intset. */
        if (isObjectRepresentableAsLongLong(value,&llval) != VR_OK) return 0;

        setobj->ptr = intsetRemove(setobj->ptr,llval,&success);
        return success ? 1 : 0;
    }

    serverPanic("Unknown set encoding");
    return 0;
}

/* Membership test: returns non zero when 'value' is an element of the set,
 * 0 otherwise. */
int setTypeIsMember(robj *subject, robj *value) {
    if (subject->encoding == OBJ_ENCODING_HT)
        return dictFind((dict*)subject->ptr,value) != NULL;

    if (subject->encoding == OBJ_ENCODING_INTSET) {
        long long llval;

        /* Only integers can be members of an intset. */
        if (isObjectRepresentableAsLongLong(value,&llval) != VR_OK)
            return 0;
        return intsetFind((intset*)subject->ptr,llval);
    }

    serverPanic("Unknown set encoding");
    return 0;
}

/* Allocate and initialize an iterator over 'subject'. The iterator records
 * the encoding the set has at creation time and must be released with
 * setTypeReleaseIterator(). */
setTypeIterator *setTypeInitIterator(robj *subject) {
    setTypeIterator *iter = dalloc(sizeof(setTypeIterator));

    iter->subject = subject;
    iter->encoding = subject->encoding;

    switch (iter->encoding) {
    case OBJ_ENCODING_HT:
        iter->di = dictGetIterator(subject->ptr);
        break;
    case OBJ_ENCODING_INTSET:
        /* Intsets are walked by position, starting from the first one. */
        iter->ii = 0;
        break;
    default:
        serverPanic("Unknown set encoding");
    }
    return iter;
}

/* Release an iterator created by setTypeInitIterator(), including the dict
 * iterator it wraps when the set is hash table encoded. */
void setTypeReleaseIterator(setTypeIterator *si) {
    if (si->encoding == OBJ_ENCODING_HT) {
        dictReleaseIterator(si->di);
    }

    dfree(si);
}

/* Advance the iterator and hand back the element at the new position.
 *
 * Set elements are stored either as objects (hash table encoding) or as
 * plain integers (intset encoding). The function returns the encoding
 * recorded in the iterator and fills the matching output: 'objele' for
 * OBJ_ENCODING_HT, 'llele' for OBJ_ENCODING_INTSET.
 *
 * Both 'objele' and 'llele' must be valid pointers: the output that is not
 * used is defensively set to a value that is easy to spot if misused.
 *
 * -1 is returned when the iteration is over.
 * The returned object is the one stored in the set, not a copy, so this
 * function is copy on write friendly. */
int setTypeNext(setTypeIterator *si, robj **objele, int64_t *llele) {
    switch (si->encoding) {
    case OBJ_ENCODING_HT: {
        dictEntry *entry = dictNext(si->di);

        if (entry == NULL) return -1;
        *objele = dictGetKey(entry);
        *llele = -123456789; /* Not needed. Defensive. */
        break;
    }
    case OBJ_ENCODING_INTSET:
        if (!intsetGet(si->subject->ptr,si->ii++,llele)) return -1;
        *objele = NULL; /* Not needed. Defensive. */
        break;
    default:
        serverPanic("Wrong set encoding in setTypeNext");
    }
    return si->encoding;
}

/* Easier to use, but not copy on write friendly, variant of setTypeNext():
 * the next element is always returned as an object, NULL when the iteration
 * is over.
 *
 * For an intset encoded set the object is created on the fly, so the caller
 * should call freeObject() against it unless it retains the pointer. For a
 * hash table encoded set the object stored inside the set is returned as
 * it is. */
robj *setTypeNextObject(setTypeIterator *si) {
    robj *member;
    int64_t number;
    int encoding = setTypeNext(si,&member,&number);

    if (encoding == -1) return NULL;
    if (encoding == OBJ_ENCODING_INTSET)
        return createStringObjectFromLongLong(number);
    if (encoding == OBJ_ENCODING_HT) return member;

    serverPanic("Unsupported encoding");
    return NULL; /* just to suppress warnings */
}

/* Pick a random element from a non empty set.
 *
 * The element is returned through 'llele' when the set is intset encoded,
 * through 'objele' when it is hash table encoded. The return value is the
 * encoding of the set, which tells the caller which output was populated.
 *
 * Both 'objele' and 'llele' must be valid pointers: the output that is not
 * used is defensively set to a value that is easy to spot if misused.
 *
 * The object returned for a hash table encoded set is the one stored in the
 * set, not a copy, so the function is copy on write friendly. */
int setTypeRandomElement(robj *setobj, robj **objele, int64_t *llele) {
    switch (setobj->encoding) {
    case OBJ_ENCODING_HT: {
        dictEntry *entry = dictGetRandomKey(setobj->ptr);

        *objele = dictGetKey(entry);
        *llele = -123456789; /* Not needed. Defensive. */
        break;
    }
    case OBJ_ENCODING_INTSET:
        *llele = intsetRandom(setobj->ptr);
        *objele = NULL; /* Not needed. Defensive. */
        break;
    default:
        serverPanic("Unknown set encoding");
    }
    return setobj->encoding;
}

/* Return the number of elements stored in the set, whatever its encoding.
 *
 * An unknown encoding triggers a panic; the trailing return guarantees that
 * the function never falls off its end without a value, like the other
 * setType helpers do. */
unsigned long setTypeSize(robj *subject) {
    if (subject->encoding == OBJ_ENCODING_HT) {
        return dictSize((dict*)subject->ptr);
    } else if (subject->encoding == OBJ_ENCODING_INTSET) {
        return intsetLen((intset*)subject->ptr);
    } else {
        serverPanic("Unknown set encoding");
    }
    return 0; /* Only reachable if the panic above returns. */
}

/* Convert the set to specified encoding. The resulting dict (when converting
 * to a hash table) is presized to hold the number of elements in the original
 * set.
 *
 * The only supported conversion is from OBJ_ENCODING_INTSET to
 * OBJ_ENCODING_HT: any other target encoding triggers a panic. */
void setTypeConvert(robj *setobj, int enc) {
    setTypeIterator *si;
    serverAssertWithInfo(NULL,setobj,setobj->type == OBJ_SET &&
                             setobj->encoding == OBJ_ENCODING_INTSET);

    if (enc == OBJ_ENCODING_HT) {
        int64_t intele;
        dict *d = dictCreate(&setDictType,NULL);
        robj *element;

        /* Presize the dict to avoid rehashing */
        dictExpand(d,intsetLen(setobj->ptr));

        /* To add the elements we extract integers and create redis objects */
        si = setTypeInitIterator(setobj);
        while (setTypeNext(si,&element,&intele) != -1) {
            int retval;

            element = createStringObjectFromLongLong(intele);
            /* The insertion is performed outside of the assertion so that
             * it never depends on how the assertion macro evaluates its
             * argument. */
            retval = dictAdd(d,element,NULL);
            serverAssertWithInfo(NULL,element,retval == DICT_OK);
        }
        setTypeReleaseIterator(si);

        /* Swap the intset with the freshly populated hash table. */
        setobj->encoding = OBJ_ENCODING_HT;
        dfree(setobj->ptr);
        setobj->ptr = d;
    } else {
        serverPanic("Unsupported set conversion");
    }
}

/* SADD key member [member ...]
 *
 * Adds the members to the set stored at key, creating the set when the key
 * does not exist, and replies with the number of members actually added.
 * The work is done while holding the write lock of the db selected for the
 * key. */
void saddCommand(client *c) {
    robj *set;
    int idx, added = 0;
    int expired = 0;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);
    set = lookupKeyWrite(c->db,c->argv[1],&expired);

    /* An existing key must hold a set. */
    if (set != NULL && set->type != OBJ_SET) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        addReply(c,shared.wrongtypeerr);
        return;
    }

    /* Missing key: create the set, picking the encoding from the first
     * member. */
    if (set == NULL) {
        set = setTypeCreate(c->argv[2]);
        dbAdd(c->db,c->argv[1],set);
    }

    for (idx = 2; idx < c->argc; idx++) {
        c->argv[idx] = tryObjectEncoding(c->argv[idx]);
        if (setTypeAdd(set,c->argv[idx])) {
            added++;
        }
    }

    if (added) {
        signalModifiedKey(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_SET,"sadd",c->argv[1],c->db->id);
    }
    c->vel->dirty += added;
    addReplyLongLong(c,added);
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* SREM key member [member ...]
 *
 * Removes the members from the set stored at key and replies with the
 * number of members actually removed. The key is deleted as soon as the set
 * becomes empty, in which case the remaining members are not processed. */
void sremCommand(client *c) {
    robj *set;
    int idx, removed = 0, emptied = 0;
    int expired = 0;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);

    set = lookupKeyWriteOrReply(c,c->argv[1],shared.czero,&expired);
    if (set == NULL || checkType(c,set,OBJ_SET)) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        return;
    }

    for (idx = 2; idx < c->argc; idx++) {
        if (!setTypeRemove(set,c->argv[idx])) continue;
        removed++;

        if (setTypeSize(set) != 0) continue;

        /* Last member gone: drop the key and stop here. */
        dbDelete(c->db,c->argv[1]);
        emptied = 1;
        break;
    }

    if (removed) {
        signalModifiedKey(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_SET,"srem",c->argv[1],c->db->id);
        if (emptied) {
            notifyKeyspaceEvent(NOTIFY_GENERIC,"del",c->argv[1],
                                c->db->id);
        }
        c->vel->dirty += removed;
    }
    addReplyLongLong(c,removed);
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* SMOVE source destination member
 *
 * Moves the member from the source set to the destination set. Replies 1
 * when the member was moved (or when source and destination are the same
 * set and the member is in it), 0 when the source key is missing or does
 * not contain the member, and an error when one of the keys does not hold
 * a set. */
void smoveCommand(client *c) {
    robj *src = lookupKeyWrite(c->db,c->argv[1],NULL);
    robj *dst = lookupKeyWrite(c->db,c->argv[2],NULL);
    robj *member;

    c->argv[3] = tryObjectEncoding(c->argv[3]);
    member = c->argv[3];

    /* Nothing to move when the source key does not exist. */
    if (src == NULL) {
        addReply(c,shared.czero);
        return;
    }

    /* Both the source and, when it exists, the destination must be sets. */
    if (checkType(c,src,OBJ_SET)) return;
    if (dst && checkType(c,dst,OBJ_SET)) return;

    /* Moving inside the same set is a no-op: only report membership. */
    if (src == dst) {
        if (setTypeIsMember(src,member)) {
            addReply(c,shared.cone);
        } else {
            addReply(c,shared.czero);
        }
        return;
    }

    /* The member must be removable from the source set. */
    if (!setTypeRemove(src,member)) {
        addReply(c,shared.czero);
        return;
    }
    notifyKeyspaceEvent(NOTIFY_SET,"srem",c->argv[1],c->db->id);

    /* A source set left empty is removed from the database. */
    if (setTypeSize(src) == 0) {
        dbDelete(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_GENERIC,"del",c->argv[1],c->db->id);
    }
    signalModifiedKey(c->db,c->argv[1]);
    signalModifiedKey(c->db,c->argv[2]);
    server.dirty++;

    /* The destination set is created on demand. */
    if (dst == NULL) {
        dst = setTypeCreate(member);
        dbAdd(c->db,c->argv[2],dst);
    }

    /* A second change is accounted only when the member was not already
     * part of the destination set. */
    if (setTypeAdd(dst,member)) {
        server.dirty++;
        notifyKeyspaceEvent(NOTIFY_SET,"sadd",c->argv[2],c->db->id);
    }
    addReply(c,shared.cone);
}

/* SISMEMBER key member
 *
 * Replies 1 when the member belongs to the set stored at key, 0 otherwise
 * (including when the key does not exist). The lookup is done while holding
 * the read lock of the db selected for the key; a missing key is counted as
 * a keyspace miss, every other outcome as a keyspace hit. */
void sismemberCommand(client *c) {
    robj *set;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    set = lookupKeyReadOrReply(c,c->argv[1],shared.czero);
    if (set == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }

    if (checkType(c,set,OBJ_SET)) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        return;
    }

    c->argv[2] = tryObjectEncoding(c->argv[2]);
    addReply(c,setTypeIsMember(set,c->argv[2]) ? shared.cone : shared.czero);

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* SCARD key
 *
 * Replies with the number of members of the set stored at key, 0 when the
 * key does not exist. The lookup is done while holding the read lock of the
 * db selected for the key; a missing key is counted as a keyspace miss,
 * every other outcome as a keyspace hit. */
void scardCommand(client *c) {
    robj *set;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    set = lookupKeyReadOrReply(c,c->argv[1],shared.czero);
    if (set == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }

    if (checkType(c,set,OBJ_SET)) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        return;
    }

    addReplyLongLong(c,setTypeSize(set));
    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* Reply to the client with every member of 'set': a multi bulk header
 * carrying the set size, followed by one bulk per member. */
void smembersGenericCommand(client *c, robj *set)
{
    setTypeIterator *iter;
    robj *member;
    int64_t number;

    addReplyMultiBulkLen(c, setTypeSize(set));

    iter = setTypeInitIterator(set);
    for (;;) {
        int encoding = setTypeNext(iter,&member,&number);

        if (encoding == -1) break;

        if (encoding == OBJ_ENCODING_HT) {
            addReplyBulk(c, member);
        } else if (encoding == OBJ_ENCODING_INTSET) {
            addReplyBulkLongLong(c, number);
        }
    }
    setTypeReleaseIterator(iter);
}

/* Handle the "SPOP key <count>" variant. The normal version of the
 * command is handled by the spopCommand() function itself. */

/* How many times bigger should be the set compared to the remaining size
 * for us to use the "create new set" strategy? Read later in the
 * implementation for more info. */
#define SPOP_MOVE_STRATEGY_MUL 5

/* Pops up to <count> random members from the set stored at argv[1] and
 * replies with them as a multi bulk. A negative count is refused with an
 * out of range error. Popping the whole set is propagated as a DEL, a
 * partial pop as a sequence of SREM operations. */
void spopWithCountCommand(client *c) {
    long l;
    unsigned long count, size;
    robj *set;
    int expired = 0;

    /* Get the count argument */
    if (getLongFromObjectOrReply(c,c->argv[2],&l,NULL) != VR_OK) return;
    if (l >= 0) {
        /* Keep the full width of the long: casting to a plain unsigned
         * would truncate large counts where long is wider than int. */
        count = (unsigned long) l;
    } else {
        addReply(c,shared.outofrangeerr);
        return;
    }

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);
    /* Make sure a key with the name inputted exists, and that it's type is
     * indeed a set. Otherwise, return nil */
    if ((set = lookupKeyWriteOrReply(c,c->argv[1],shared.emptymultibulk,&expired))
        == NULL || checkType(c,set,OBJ_SET)) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        return;
    }

    /* If count is zero, serve an empty multibulk ASAP to avoid special
     * cases later. */
    if (count == 0) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        addReply(c,shared.emptymultibulk);
        return;
    }

    size = setTypeSize(set);

    /* Generate an SPOP keyspace notification */
    notifyKeyspaceEvent(NOTIFY_SET,"spop",c->argv[1],c->db->id);
    c->vel->dirty += count;

    /* CASE 1:
     * The number of requested elements is greater than or equal to
     * the number of elements inside the set: simply return the whole set. */
    if (count >= size) {
        robj *aux;
        
        /* We just return the entire set */
        smembersGenericCommand(c, set);

        /* Delete the set as it is now empty */
        dbDelete(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_GENERIC,"del",c->argv[1],c->db->id);

        /* Propagate this command as an DEL operation */
        aux = dupStringObjectUnconstant(c->argv[1]);
        rewriteClientCommandVector(c,2,shared.del,aux);
        signalModifiedKey(c->db,c->argv[1]);
        c->vel->dirty++;
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        return;
    }

    /* Case 2 and 3 require to replicate SPOP as a set of SREM commands.
     * Prepare our replication argument vector. Also send the array length
     * which is common to both the code paths. */
    robj *propargv[3];
    propargv[0] = createStringObject("SREM",4);
    propargv[1] = c->argv[1];
    addReplyMultiBulkLen(c,count);

    /* Common iteration vars. */
    robj *objele;
    int encoding;
    int64_t llele;
    unsigned long remaining = size-count; /* Elements left after SPOP. */

    /* If we are here, the number of requested elements is less than the
     * number of elements inside the set. Also we are sure that count < size.
     * Use two different strategies.
     *
     * CASE 2: The number of elements to return is small compared to the
     * set size. We can just extract random elements, return them to the
     * client and remove them from the set. */
    if (remaining*SPOP_MOVE_STRATEGY_MUL > count) {
        while(count--) {
            /* Always work on a private copy of the element. */
            encoding = setTypeRandomElement(set,&objele,&llele);
            if (encoding == OBJ_ENCODING_INTSET) {
                objele = createStringObjectFromLongLong(llele);
            } else {
                objele = dupStringObjectUnconstant(objele);
            }

            /* Return the element to the client and remove from the set. */
            addReplyBulk(c,objele);
            setTypeRemove(set,objele);

            /* Replicate/AOF this command as an SREM operation */
            propargv[2] = objele;
            alsoPropagate(server.sremCommand,c->db->id,propargv,3,
                PROPAGATE_AOF|PROPAGATE_REPL);
            freeObject(objele);
        }
    } else {
    /* CASE 3: The number of elements to return is very big, approaching
     * the size of the set itself. After some time extracting random elements
     * from such a set becomes computationally expensive, so we use
     * a different strategy, we extract random elements that we don't
     * want to return (the elements that will remain part of the set),
     * creating a new set as we do this (that will be stored as the original
     * set). Then we return the elements left in the original set and
     * release it. */
        robj *newset = NULL;

        /* Create a new set with just the remaining elements. */
        while(remaining--) {
            encoding = setTypeRandomElement(set,&objele,&llele);
            if (encoding == OBJ_ENCODING_INTSET)
                objele = createStringObjectFromLongLong(llele);
            
            if (!newset) newset = setTypeCreate(objele);
            setTypeAdd(newset,objele);
            setTypeRemove(set,objele);
            /* Only the temporary object built for an intset element is
             * ours to free. */
            if (encoding == OBJ_ENCODING_INTSET)
                freeObject(objele);
        }

        /* Transfer the old set to the client. */
        setTypeIterator *si;
        si = setTypeInitIterator(set);
        while((encoding = setTypeNext(si,&objele,&llele)) != -1) {
            if (encoding == OBJ_ENCODING_INTSET)
                objele = createStringObjectFromLongLong(llele);
            addReplyBulk(c,objele);

            /* Replicate/AOF this command as an SREM operation */
            propargv[2] = objele;
            alsoPropagate(server.sremCommand,c->db->id,propargv,3,
                PROPAGATE_AOF|PROPAGATE_REPL);
            if (encoding == OBJ_ENCODING_INTSET)
                freeObject(objele);
        }
        setTypeReleaseIterator(si);

        /* Assign the new set as the key value. */
        dbOverwrite(c->db,c->argv[1],newset);
    }

    /* Don't propagate the command itself even if we incremented the
     * dirty counter. We don't want to propagate an SPOP command since
     * we propagated the command as a set of SREMs operations using
     * the alsoPropagate() API. */
    freeObject(propargv[0]);
    preventCommandPropagation(c);
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* SPOP key [count]
 *
 * Without a count a single random member is removed from the set and
 * returned as a bulk reply; the command is rewritten as an SREM of that
 * member. The "SPOP key <count>" form is delegated to
 * spopWithCountCommand(), more than one extra argument is a syntax
 * error. */
void spopCommand(client *c) {
    robj *set, *ele, *srem_name, *key_copy;
    int64_t llele;
    int encoding;
    int expired = 0;

    if (c->argc >= 3) {
        if (c->argc == 3) {
            spopWithCountCommand(c);
        } else {
            addReply(c,shared.syntaxerr);
        }
        return;
    }

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);

    /* The key must exist and hold a set. */
    set = lookupKeyWriteOrReply(c,c->argv[1],shared.nullbulk,&expired);
    if (set == NULL || checkType(c,set,OBJ_SET)) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
        return;
    }

    /* Pick a random member, then remove it from the set keeping a private
     * object for the reply and for the rewritten command. */
    encoding = setTypeRandomElement(set,&ele,&llele);
    if (encoding != OBJ_ENCODING_INTSET) {
        ele = dupStringObjectUnconstant(ele);
        setTypeRemove(set,ele);
    } else {
        ele = createStringObjectFromLongLong(llele);
        set->ptr = intsetRemove(set->ptr,llele,NULL);
    }

    notifyKeyspaceEvent(NOTIFY_SET,"spop",c->argv[1],c->db->id);

    /* Replicate/AOF this command as an SREM operation */
    srem_name = createStringObject("SREM",4);
    key_copy = dupStringObjectUnconstant(c->argv[1]);
    rewriteClientCommandVector(c,3,srem_name,key_copy,ele);

    /* Send the popped member to the client. */
    addReplyBulk(c,ele);

    /* A set left without members is removed from the database. */
    if (setTypeSize(set) == 0) {
        dbDelete(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_GENERIC,"del",c->argv[1],c->db->id);
    }

    /* Set has been modified */
    signalModifiedKey(c->db,c->argv[1]);
    c->vel->dirty++;
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* handle the "SRANDMEMBER key <count>" variant. The normal version of the
 * command is handled by the srandmemberCommand() function itself. */

/* How many times bigger should be the set compared to the requested size
 * for us to don't use the "remove elements" strategy? Read later in the
 * implementation for more info. */
#define SRANDMEMBER_SUB_STRATEGY_MUL 3

/* SRANDMEMBER key <count>
 *
 * Replies with a multi bulk of random members of the set stored at argv[1].
 *
 *  - count >= 0: up to 'count' distinct members are returned.
 *  - count <  0: exactly |count| members are returned and the same member
 *                may appear more than once.
 *
 * A missing key or a zero count yields an empty multi bulk reply.
 *
 * NOTE(review): unlike smembersCommand(), this function does not call
 * fetchInternalDbByKey()/lockDbRead() itself -- confirm that the caller is
 * responsible for selecting and locking the database. */
void srandmemberWithCountCommand(client *c) {
    long l;
    unsigned long count, size;
    int uniq = 1;
    robj *set, *ele;
    int64_t llele;
    int encoding;

    dict *d;

    if (getLongFromObjectOrReply(c,c->argv[2],&l,NULL) != VR_OK) return;
    if (l >= 0) {
        /* Convert at the full width of 'count': a cast to plain 'unsigned'
         * would silently truncate values that do not fit in an int. */
        count = (unsigned long) l;
    } else {
        /* A negative count means: return the same elements multiple times
         * (i.e. don't remove the extracted element after every extraction).
         * The negation is done in unsigned arithmetic so that LONG_MIN
         * does not trigger signed overflow. */
        count = 0UL - (unsigned long) l;
        uniq = 0;
    }

    if ((set = lookupKeyReadOrReply(c,c->argv[1],shared.emptymultibulk))
        == NULL || checkType(c,set,OBJ_SET)) return;
    size = setTypeSize(set);

    /* If count is zero, serve it ASAP to avoid special cases later. */
    if (count == 0) {
        addReply(c,shared.emptymultibulk);
        return;
    }

    /* CASE 1: The count was negative, so the extraction method is just:
     * "return N random elements" sampling the whole set every time.
     * This case is trivial and can be served without auxiliary data
     * structures. */
    if (!uniq) {
        addReplyMultiBulkLen(c,count);
        while(count--) {
            encoding = setTypeRandomElement(set,&ele,&llele);
            if (encoding == OBJ_ENCODING_INTSET) {
                addReplyBulkLongLong(c,llele);
            } else {
                addReplyBulk(c,ele);
            }
        }
        return;
    }

    /* CASE 2:
     * The number of requested elements is greater than or equal to the
     * number of elements inside the set: simply return the whole set. */
    if (count >= size) {
        smembersGenericCommand(c, set);
        return;
    }

    /* For CASE 3 and CASE 4 we need an auxiliary dictionary. */
    d = dictCreate(&setDictType,NULL);

    /* CASE 3:
     * The number of elements inside the set is not greater than
     * SRANDMEMBER_SUB_STRATEGY_MUL times the number of requested elements.
     * In this case we create a set from scratch with all the elements, and
     * subtract random elements to reach the requested number of elements.
     *
     * This is done because if the number of requested elements is just
     * a bit less than the number of elements in the set, the natural approach
     * used in CASE 4 is highly inefficient. */
    if (count*SRANDMEMBER_SUB_STRATEGY_MUL > size) {
        setTypeIterator *si;

        /* Add all the elements into the temporary dictionary. */
        si = setTypeInitIterator(set);
        while((encoding = setTypeNext(si,&ele,&llele)) != -1) {
            int retval = DICT_ERR;

            if (encoding == OBJ_ENCODING_INTSET) {
                retval = dictAdd(d,createStringObjectFromLongLong(llele),NULL);
            } else {
                retval = dictAdd(d,dupStringObject(ele),NULL);
            }
            ASSERT(retval == DICT_OK);
        }
        setTypeReleaseIterator(si);
        ASSERT(dictSize(d) == size);

        /* Remove random elements to reach the right count. */
        while(size > count) {
            dictEntry *de;

            de = dictGetRandomKey(d);
            dictDelete(d,dictGetKey(de));
            size--;
        }
    }

    /* CASE 4: We have a big set compared to the requested number of elements.
     * In this case we can simply get random elements from the set and add
     * to the temporary set, trying to eventually get enough unique elements
     * to reach the specified count. */
    else {
        unsigned long added = 0;

        while(added < count) {
            encoding = setTypeRandomElement(set,&ele,&llele);
            if (encoding == OBJ_ENCODING_INTSET) {
                ele = createStringObjectFromLongLong(llele);
            } else {
                ele = dupStringObject(ele);
            }
            /* Try to add the object to the dictionary. If it already exists
             * free it, otherwise increment the number of objects we have
             * in the result dictionary. */
            if (dictAdd(d,ele,NULL) == DICT_OK)
                added++;
            else
                decrRefCount(ele);
        }
    }

    /* CASE 3 & 4: send the result to the user. */
    {
        dictIterator *di;
        dictEntry *de;

        addReplyMultiBulkLen(c,count);
        di = dictGetIterator(d);
        while((de = dictNext(di)) != NULL)
            addReplyBulk(c,dictGetKey(de));
        dictReleaseIterator(di);
        dictRelease(d);
    }
}

/* SRANDMEMBER key [count]
 *
 * With a count argument the work is delegated to
 * srandmemberWithCountCommand(); more than one extra argument is a syntax
 * error. Without a count, a single random member is sent as a bulk reply
 * (null bulk when the key is missing). */
void srandmemberCommand(client *c) {
    robj *setobj;
    robj *member;
    int64_t intmember;

    if (c->argc > 3) {
        addReply(c,shared.syntaxerr);
        return;
    }
    if (c->argc == 3) {
        srandmemberWithCountCommand(c);
        return;
    }

    setobj = lookupKeyReadOrReply(c,c->argv[1],shared.nullbulk);
    if (setobj == NULL) return;
    if (checkType(c,setobj,OBJ_SET)) return;

    /* The random element comes back either as an integer (intset encoded
     * sets) or as an object. */
    if (setTypeRandomElement(setobj,&member,&intmember) == OBJ_ENCODING_INTSET)
        addReplyBulkLongLong(c,intmember);
    else
        addReplyBulk(c,member);
}

/* SMEMBERS key
 *
 * Looks the key up under a read lock on its database and emits all members
 * through smembersGenericCommand(). A missing key is counted as a keyspace
 * miss; an existing key (even of the wrong type) is counted as a hit. */
void smembersCommand(client *c) {
    robj *setobj;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);

    setobj = lookupKeyReadOrReply(c,c->argv[1],shared.emptymultibulk);
    if (setobj == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }

    /* checkType() has already replied with an error when it returns
     * non-zero, so the members are only sent for a real set. */
    if (!checkType(c,setobj,OBJ_SET)) {
        smembersGenericCommand(c, setobj);
    }

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* qsort() comparator ordering set objects by ascending cardinality.
 *
 * 's1' and 's2' point to 'robj *' array slots. The sizes are compared
 * explicitly instead of being subtracted: the difference of two unsigned
 * long values does not fit in an int in general and could yield the wrong
 * sign after truncation. Returns -1, 0 or 1. */
int qsortCompareSetsByCardinality(const void *s1, const void *s2) {
    unsigned long n1 = setTypeSize(*(robj**)s1);
    unsigned long n2 = setTypeSize(*(robj**)s2);

    return (n1 > n2) - (n1 < n2);
}

/* This is used by SDIFF and in this case we can receive NULL that should
 * be handled as empty sets. */
int qsortCompareSetsByRevCardinality(const void *s1, const void *s2) {
    robj *o1 = *(robj**)s1, *o2 = *(robj**)s2;

    return  (o2 ? setTypeSize(o2) : 0) - (o1 ? setTypeSize(o1) : 0);
}

/* Shared implementation of SINTER and SINTERSTORE.
 *
 * 'setkeys'/'setnum' are the keys to intersect. When 'dstkey' is NULL the
 * intersection is sent to the client as a multi bulk reply; otherwise it is
 * stored at 'dstkey' (replacing any previous value) and its cardinality is
 * sent as an integer reply.
 *
 * Each key is looked up under its own database lock, one at a time:
 *  1. Every key is checked for existence/type and the smallest set is
 *     remembered. A missing key makes the intersection empty.
 *  2. The smallest set is copied into the private 'min_len_set'.
 *  3. Every element of that copy is tested against the other sets; keys are
 *     looked up again for each test, so a key that vanished or changed type
 *     in the meantime is handled here as well.
 *  4. The result is replied or stored. */
void sinterGenericCommand(client *c, robj **setkeys,
                          unsigned long setnum, robj *dstkey) {
    setTypeIterator *si;
    robj *eleobj, *dstset = NULL;
    int64_t intobj;
    unsigned long j, cardinality = 0;
    int encoding;
    robj *setobj, *min_len_set;
    unsigned long min_len = -1; /* ULONG_MAX marks "no set seen yet" */
    unsigned long min_len_idx = 0;

    for (j = 0; j < setnum; j++) {
        fetchInternalDbByKey(c,setkeys[j]);
        lockDbRead(c->db);
        setobj = lookupKeyRead(c->db,setkeys[j]);
        if (!setobj) {
            unlockDb(c->db);
            update_stats_add(c->vel->stats,keyspace_misses,1);
            if (dstkey) {
                /* Empty intersection: the destination key must not
                 * survive. */
                fetchInternalDbByKey(c,dstkey);
                lockDbWrite(c->db);
                if (dbDelete(c->db,dstkey)) {
                    signalModifiedKey(c->db,dstkey);
                    c->vel->dirty++;
                }
                unlockDb(c->db);
                addReply(c,shared.czero);
            } else {
                addReply(c,shared.emptymultibulk);
            }
            return;
        }
        if (checkType(c,setobj,OBJ_SET)) {
            unlockDb(c->db);
            update_stats_add(c->vel->stats,keyspace_hits,1);
            return;
        }

        if (min_len == -1 || setTypeSize(setobj) < min_len) {
            min_len = setTypeSize(setobj);
            min_len_idx = j;
        }

        unlockDb(c->db);
        update_stats_add(c->vel->stats,keyspace_hits,1);
    }

    /* Take a private copy of the smallest set so that it can be iterated
     * without holding its database lock. */
    min_len_set = createIntsetObject();
    fetchInternalDbByKey(c,setkeys[min_len_idx]);
    lockDbRead(c->db);
    setobj = lookupKeyRead(c->db,setkeys[min_len_idx]);
    if (!setobj) {
        unlockDb(c->db);
        freeObject(min_len_set);
        goto done;
    }
    if (checkType(c,setobj,OBJ_SET)) {
        unlockDb(c->db);
        freeObject(min_len_set);
        return;
    }
    si = setTypeInitIterator(setobj);
    while((eleobj = setTypeNextObject(si)) != NULL) {
        setTypeAdd(min_len_set,eleobj);
        if (si->encoding == OBJ_ENCODING_INTSET)
            freeObject(eleobj); /* free this object for intset type */
    }
    setTypeReleaseIterator(si);
    unlockDb(c->db);

    dstset = createIntsetObject();

    /* Iterate all the elements of the first (smallest) set, and test
     * the element against all the other sets, if at least one set does
     * not include the element it is discarded */
    si = setTypeInitIterator(min_len_set);
    while((encoding = setTypeNext(si,&eleobj,&intobj)) != -1) {
        for (j = 0; j < setnum; j++) {
            if (j == min_len_idx) continue;
            fetchInternalDbByKey(c,setkeys[j]);
            lockDbRead(c->db);
            setobj = lookupKeyRead(c->db,setkeys[j]);
            if (!setobj) {
                unlockDb(c->db);
                /* Release the iterator BEFORE freeing the set it walks:
                 * releasing it afterwards may touch freed memory. */
                setTypeReleaseIterator(si);
                freeObject(min_len_set);
                if (dstset) {
                    freeObject(dstset);
                    dstset = NULL;
                }
                goto done;
            }
            if (checkType(c,setobj,OBJ_SET)) {
                unlockDb(c->db);
                /* Same ordering requirement as above. */
                setTypeReleaseIterator(si);
                freeObject(min_len_set);
                if (dstset) {
                    freeObject(dstset);
                    dstset = NULL;
                }
                return;
            }

            if (encoding == OBJ_ENCODING_INTSET) {
                /* intset with intset is simple... and fast */
                if (setobj->encoding == OBJ_ENCODING_INTSET &&
                    !intsetFind((intset*)setobj->ptr,intobj))
                {
                    unlockDb(c->db);
                    break;
                /* in order to compare an integer with an object we
                 * have to use the generic function, creating an object
                 * for this */
                } else if (setobj->encoding == OBJ_ENCODING_HT) {
                    eleobj = createStringObjectFromLongLong(intobj);
                    if (!setTypeIsMember(setobj,eleobj)) {
                        unlockDb(c->db);
                        freeObject(eleobj);
                        break;
                    }
                    freeObject(eleobj);
                }
            } else if (encoding == OBJ_ENCODING_HT) {
                /* Optimization... if the source object is integer
                 * encoded AND the target set is an intset, we can get
                 * a much faster path. */
                if (eleobj->encoding == OBJ_ENCODING_INT &&
                    setobj->encoding == OBJ_ENCODING_INTSET &&
                    !intsetFind((intset*)setobj->ptr,(long)eleobj->ptr))
                {
                    unlockDb(c->db);
                    break;
                /* else... object to object check is easy as we use the
                 * type agnostic API here. */
                } else if (!setTypeIsMember(setobj,eleobj)) {
                    unlockDb(c->db);
                    break;
                }
            }
            unlockDb(c->db);
        }

        /* Only take action when all sets contain the member */
        if (j == setnum) {
            if (encoding == OBJ_ENCODING_INTSET) {
                eleobj = createStringObjectFromLongLong(intobj);
                setTypeAdd(dstset,eleobj);
                freeObject(eleobj);
            } else {
                setTypeAdd(dstset,eleobj);
            }
            cardinality ++;
        }
    }
    setTypeReleaseIterator(si);
    freeObject(min_len_set);

done:
    if (dstkey) {
        int deleted;

        fetchInternalDbByKey(c,dstkey);
        lockDbWrite(c->db);
        /* Store the resulting set into the target, if the intersection
         * is not an empty set. */
        deleted = dbDelete(c->db,dstkey);
        if (dstset && setTypeSize(dstset) > 0) {
            dbAdd(c->db,dstkey,dstset);
            addReplyLongLong(c,setTypeSize(dstset));
            notifyKeyspaceEvent(NOTIFY_SET,"sinterstore",
                dstkey,c->db->id);
        } else {
            if (dstset) {
                freeObject(dstset);
                dstset = NULL;
            }
            addReply(c,shared.czero);
            if (deleted)
                notifyKeyspaceEvent(NOTIFY_GENERIC,"del",
                    dstkey,c->db->id);
        }
        signalModifiedKey(c->db,dstkey);
        unlockDb(c->db);
        c->vel->dirty++;
    } else {
        addReplyMultiBulkLen(c,cardinality);
        if (dstset && setTypeSize(dstset) > 0) {
            si = setTypeInitIterator(dstset);
            while((eleobj = setTypeNextObject(si)) != NULL) {
                addReplyBulk(c,eleobj);
                if (si->encoding == OBJ_ENCODING_INTSET)
                    freeObject(eleobj); /* free this object for intset type */
            }
            setTypeReleaseIterator(si);
        }
        if (dstset) freeObject(dstset);
    }
}

/* SINTER key [key ...]: intersect every key after the command name and
 * reply with the members (no destination key). */
void sinterCommand(client *c) {
    robj **keys = c->argv+1;
    unsigned long numkeys = c->argc-1;

    sinterGenericCommand(c,keys,numkeys,NULL);
}

/* SINTERSTORE destination key [key ...]: argv[1] is the destination, the
 * remaining arguments are the sets to intersect. */
void sinterstoreCommand(client *c) {
    robj *destination = c->argv[1];
    robj **keys = c->argv+2;
    unsigned long numkeys = c->argc-2;

    sinterGenericCommand(c,keys,numkeys,destination);
}

/* Operation selectors passed as the 'op' argument of
 * sunionDiffGenericCommand(). */
#define SET_OP_UNION 0
#define SET_OP_DIFF 1
#define SET_OP_INTER 2 /* NOTE(review): not referenced by the nearby code */

/* Shared implementation of SUNION, SUNIONSTORE, SDIFF and SDIFFSTORE.
 *
 * 'setkeys'/'setnum' are the source keys, 'op' is SET_OP_UNION or
 * SET_OP_DIFF. When 'dstkey' is NULL the resulting members are sent as a
 * multi bulk reply; otherwise the result is stored at 'dstkey' (replacing
 * any previous value) and its cardinality is sent as an integer reply.
 *
 * Missing source keys are treated as empty sets; a source key holding a
 * non-set value aborts the command (checkType() sends the error reply).
 * Every key is looked up under its own database lock, one at a time, so the
 * keys are re-validated each time they are visited. */
void sunionDiffGenericCommand(client *c, robj **setkeys, int setnum,
                              robj *dstkey, int op) {
    setTypeIterator *si;
    robj *ele, *dstset = NULL;
    int j, cardinality = 0;
    int diff_algo = 1;
    robj *setobj;
    long long algo_one_work = 0, algo_two_work = 0;
    long long first_length = 0;

    /* First pass: validate the types and, for DIFF, collect the numbers
     * needed to pick the cheaper algorithm. */
    for (j = 0; j < setnum; j++) {
        fetchInternalDbByKey(c,setkeys[j]);
        lockDbRead(c->db);
        setobj = lookupKeyRead(c->db,setkeys[j]);
        if (!setobj) {
            unlockDb(c->db);
            update_stats_add(c->vel->stats,keyspace_misses,1);
            continue;
        }
        if (checkType(c,setobj,OBJ_SET)) {
            unlockDb(c->db);
            update_stats_add(c->vel->stats,keyspace_hits,1);
            return;
        }

        if (op == SET_OP_DIFF) {
            if (j == 0) first_length = setTypeSize(setobj);
            algo_one_work += first_length;
            algo_two_work += setTypeSize(setobj);
        }

        unlockDb(c->db);
        update_stats_add(c->vel->stats,keyspace_hits,1);
    }

    /* Select what DIFF algorithm to use.
     *
     * Algorithm 1 is O(N*M) where N is the size of the element first set
     * and M the total number of sets.
     *
     * Algorithm 2 is O(N) where N is the total number of elements in all
     * the sets.
     *
     * We compute what is the best bet with the current input here. */
    if (op == SET_OP_DIFF) {
        /* Algorithm 1 has better constant times and performs less operations
         * if there are elements in common. Give it some advantage. */
        algo_one_work /= 2;
        diff_algo = (algo_one_work <= algo_two_work) ? 1 : 2;
    }

    /* We need a temp set object to store our union. If the dstkey
     * is not NULL (that is, we are inside an SUNIONSTORE operation) then
     * this set object will be the resulting object to set into the target key*/
    dstset = createIntsetObject();

    if (op == SET_OP_UNION) {
        /* Union is trivial, just add every element of every set to the
         * temporary set. */
        for (j = 0; j < setnum; j++) {
            fetchInternalDbByKey(c,setkeys[j]);
            lockDbRead(c->db);
            setobj = lookupKeyRead(c->db,setkeys[j]);

            if (!setobj) {
                unlockDb(c->db);
                continue;
            }
            if (checkType(c,setobj,OBJ_SET)) {
                unlockDb(c->db);
                freeObject(dstset);
                return;
            }

            si = setTypeInitIterator(setobj);
            while((ele = setTypeNextObject(si)) != NULL) {
                if (setTypeAdd(dstset,ele)) cardinality++;
                if (si->encoding == OBJ_ENCODING_INTSET)
                    freeObject(ele); /* free this object for intset type */
            }
            setTypeReleaseIterator(si);
            unlockDb(c->db);
        }
    } else if (op == SET_OP_DIFF && diff_algo == 1) {
        /* DIFF Algorithm 1:
         *
         * We perform the diff by iterating all the elements of the first set,
         * and only adding it to the target set if the element does not exist
         * into all the other sets.
         *
         * This way we perform at max N*M operations, where N is the size of
         * the first set, and M the number of sets. */
        robj *first_set;

        /* Work on a private copy of the first set so that it can be
         * iterated without holding its database lock. */
        first_set = createIntsetObject();
        fetchInternalDbByKey(c,setkeys[0]);
        lockDbRead(c->db);
        setobj = lookupKeyRead(c->db,setkeys[0]);
        if (!setobj) {
            unlockDb(c->db);
            freeObject(first_set);
            goto done;
        }
        if (checkType(c,setobj,OBJ_SET)) {
            unlockDb(c->db);
            freeObject(dstset);
            freeObject(first_set);
            return;
        }
        si = setTypeInitIterator(setobj);
        while((ele = setTypeNextObject(si)) != NULL) {
            setTypeAdd(first_set,ele);
            if (si->encoding == OBJ_ENCODING_INTSET)
                freeObject(ele); /* free this object for intset type */
        }
        setTypeReleaseIterator(si);
        unlockDb(c->db);

        si = setTypeInitIterator(first_set);
        while((ele = setTypeNextObject(si)) != NULL) {
            for (j = 1; j < setnum; j++) {
                fetchInternalDbByKey(c,setkeys[j]);
                lockDbRead(c->db);
                setobj = lookupKeyRead(c->db,setkeys[j]);
                if (!setobj) {
                    unlockDb(c->db);
                    continue;
                }
                if (checkType(c,setobj,OBJ_SET)) {
                    unlockDb(c->db);
                    if (si->encoding == OBJ_ENCODING_INTSET)
                        freeObject(ele); /* free this object for intset type */
                    /* Release the iterator BEFORE freeing the set it
                     * walks: releasing it afterwards may touch freed
                     * memory. */
                    setTypeReleaseIterator(si);
                    freeObject(first_set);
                    freeObject(dstset);
                    return;
                }
                if (setTypeIsMember(setobj,ele)) {
                    unlockDb(c->db);
                    break;
                }
                unlockDb(c->db);
            }

            if (j == setnum) {
                /* There is no other set with this element. Add it. */
                setTypeAdd(dstset,ele);
                cardinality++;
            }

            if (si->encoding == OBJ_ENCODING_INTSET)
                freeObject(ele); /* free this object for intset type */
        }
        setTypeReleaseIterator(si);
        freeObject(first_set);
    } else if (op == SET_OP_DIFF && diff_algo == 2) {
        /* DIFF Algorithm 2:
         *
         * Add all the elements of the first set to the auxiliary set.
         * Then remove all the elements of all the next sets from it.
         *
         * This is O(N) where N is the sum of all the elements in every
         * set. */
        for (j = 0; j < setnum; j++) {
            /* Visit the j-th key: looking up setkeys[0] on every iteration
             * would subtract the first set from itself and always produce
             * an empty result. */
            fetchInternalDbByKey(c,setkeys[j]);
            lockDbRead(c->db);
            setobj = lookupKeyRead(c->db,setkeys[j]);
            if (!setobj) {
                if (j == 0) {
                    unlockDb(c->db);
                    goto done;
                }

                unlockDb(c->db);
                continue; /* non existing keys are like empty sets */
            }
            if (checkType(c,setobj,OBJ_SET)) {
                unlockDb(c->db);
                freeObject(dstset);
                return;
            }

            si = setTypeInitIterator(setobj);
            while((ele = setTypeNextObject(si)) != NULL) {
                if (j == 0) {
                    if (setTypeAdd(dstset,ele)) cardinality++;
                } else {
                    if (setTypeRemove(dstset,ele)) cardinality--;
                }
                if (si->encoding == OBJ_ENCODING_INTSET)
                    freeObject(ele); /* free this object for intset type */
            }
            setTypeReleaseIterator(si);

            /* Exit if result set is empty as any additional removal
             * of elements will have no effect. */
            if (cardinality == 0) {
                unlockDb(c->db);
                break;
            }
            unlockDb(c->db);
        }
    }

done:
    /* Output the content of the resulting set, if not in STORE mode */
    if (!dstkey) {
        addReplyMultiBulkLen(c,cardinality);
        si = setTypeInitIterator(dstset);
        while((ele = setTypeNextObject(si)) != NULL) {
            addReplyBulk(c,ele);
            if (si->encoding == OBJ_ENCODING_INTSET)
                freeObject(ele); /* free this object for intset type */
        }
        setTypeReleaseIterator(si);
        freeObject(dstset);
    } else {
        int deleted;

        fetchInternalDbByKey(c,dstkey);
        lockDbWrite(c->db);
        /* If we have a target key where to store the resulting set
         * create this key with the result set inside */
        deleted = dbDelete(c->db,dstkey);
        if (setTypeSize(dstset) > 0) {
            dbAdd(c->db,dstkey,dstset);
            addReplyLongLong(c,setTypeSize(dstset));
            notifyKeyspaceEvent(NOTIFY_SET,
                op == SET_OP_UNION ? "sunionstore" : "sdiffstore",
                dstkey,c->db->id);
        } else {
            freeObject(dstset);
            addReply(c,shared.czero);
            if (deleted)
                notifyKeyspaceEvent(NOTIFY_GENERIC,"del",
                    dstkey,c->db->id);
        }
        /* Signal the modification while the write lock is still held, as
         * sinterGenericCommand() does. */
        signalModifiedKey(c->db,dstkey);
        unlockDb(c->db);
        c->vel->dirty++;
    }
}

/* SUNION key [key ...]: union of every key after the command name, sent
 * back to the client (no destination key). */
void sunionCommand(client *c) {
    robj **keys = c->argv+1;
    int numkeys = c->argc-1;

    sunionDiffGenericCommand(c,keys,numkeys,NULL,SET_OP_UNION);
}

/* SUNIONSTORE destination key [key ...]: argv[1] is the destination, the
 * remaining arguments are the sets to unite. */
void sunionstoreCommand(client *c) {
    robj *destination = c->argv[1];
    robj **keys = c->argv+2;
    int numkeys = c->argc-2;

    sunionDiffGenericCommand(c,keys,numkeys,destination,SET_OP_UNION);
}

/* SDIFF key [key ...]: members of the first key that are in none of the
 * following ones, sent back to the client (no destination key). */
void sdiffCommand(client *c) {
    robj **keys = c->argv+1;
    int numkeys = c->argc-1;

    sunionDiffGenericCommand(c,keys,numkeys,NULL,SET_OP_DIFF);
}

/* SDIFFSTORE destination key [key ...]: argv[1] is the destination, the
 * remaining arguments are the sets to subtract from one another. */
void sdiffstoreCommand(client *c) {
    robj *destination = c->argv[1];
    robj **keys = c->argv+2;
    int numkeys = c->argc-2;

    sunionDiffGenericCommand(c,keys,numkeys,destination,SET_OP_DIFF);
}

/* SSCAN: thin entry point that forwards to the generic scan
 * implementation, selecting the set flavour. */
void sscanCommand(client *c)
{
    scanGenericCommand(c, SCAN_TYPE_SET);
}


================================================
FILE: src/vr_t_set.h
================================================
#ifndef _VR_T_SET_H_
#define _VR_T_SET_H_

/* Helpers operating on set objects: creation, membership updates and
 * queries, iteration and random sampling. */
robj *setTypeCreate(robj *value);
int setTypeAdd(robj *subject, robj *value);
int setTypeRemove(robj *setobj, robj *value);
int setTypeIsMember(robj *subject, robj *value);
setTypeIterator *setTypeInitIterator(robj *subject);
void setTypeReleaseIterator(setTypeIterator *si);
int setTypeNext(setTypeIterator *si, robj **objele, int64_t *llele);
robj *setTypeNextObject(setTypeIterator *si);
int setTypeRandomElement(robj *setobj, robj **objele, int64_t *llele);

unsigned long setTypeSize(robj *subject);
void setTypeConvert(robj *setobj, int enc);

/* Client command entry points for the set commands. */
void saddCommand(client *c);
void sremCommand(client *c);
void smoveCommand(client *c);
void sismemberCommand(client *c);
void scardCommand(client *c);
void spopWithCountCommand(client *c);
void spopCommand(client *c);
void srandmemberWithCountCommand(client *c);
void srandmemberCommand(client *c);
void smembersCommand(client *c);

/* qsort() comparators over arrays of 'robj *' set objects. */
int qsortCompareSetsByCardinality(const void *s1, const void *s2);
int qsortCompareSetsByRevCardinality(const void *s1, const void *s2);

/* Multi-key set operations; the *Generic* functions take an optional
 * destination key ('dstkey', NULL when the result is only replied). */
void sinterGenericCommand(client *c, robj **setkeys, unsigned long setnum, robj *dstkey);
void sinterCommand(client *c);
void sinterstoreCommand(client *c);
void sunionDiffGenericCommand(client *c, robj **setkeys, int setnum, robj *dstkey, int op);
void sunionCommand(client *c);
void sunionstoreCommand(client *c);
void sdiffCommand(client *c);
void sdiffstoreCommand(client *c);
void sscanCommand(client *c);

#endif


================================================
FILE: src/vr_t_string.c
================================================
#include <vr_core.h>

/*-----------------------------------------------------------------------------
 * String Commands
 *----------------------------------------------------------------------------*/

/* Enforce the 512MB limit on string values.
 *
 * Returns VR_OK when 'size' is within the limit. Otherwise an error reply
 * is queued on the client and VR_ERROR is returned. */
static int checkStringLength(client *c, long long size) {
    if (size <= 512*1024*1024) return VR_OK;

    addReplyError(c,"string exceeds maximum allowed size (512MB)");
    return VR_ERROR;
}

/* The setGenericCommand() function implements the SET operation with different
 * options and variants. This function is called in order to implement the
 * following commands: SET, SETEX, PSETEX, SETNX.
 *
 * 'flags' changes the behavior of the command (NX or XX, see below).
 *
 * 'expire' represents an expire to set in form of a Redis object as passed
 * by the user. It is interpreted according to the specified 'unit'.
 *
 * 'ok_reply' and 'abort_reply' is what the function will reply to the client
 * if the operation is performed, or when it is not because of NX or
 * XX flags.
 *
 * If ok_reply is NULL "+OK" is used.
 * If abort_reply is NULL, "$-1" is used. */

#define OBJ_SET_NO_FLAGS 0
#define OBJ_SET_NX (1<<0)     /* Set if key not exists. */
#define OBJ_SET_XX (1<<1)     /* Set if key exists. */
#define OBJ_SET_EX (1<<2)     /* Set if time in seconds is given */
#define OBJ_SET_PX (1<<3)     /* Set if time in ms is given */

/* Common implementation behind SET, SETNX, SETEX and PSETEX.
 *
 * 'flags' carries OBJ_SET_NX / OBJ_SET_XX, 'expire' (may be NULL) is the
 * user supplied TTL interpreted according to 'unit'. 'ok_reply' and
 * 'abort_reply' override the default "+OK" / null bulk replies when not
 * NULL. The key is written under the write lock of its database. */
void setGenericCommand(client *c, int flags, robj *key, robj *val, robj *expire, int unit, robj *ok_reply, robj *abort_reply) {
    long long milliseconds = 0; /* only meaningful when 'expire' is given */
    int expired = 0;
    int exist;
    int refused;

    /* Validate the TTL before touching the database. */
    if (expire != NULL) {
        if (getLongLongFromObjectOrReply(c, expire, &milliseconds, NULL) != VR_OK) {
            return;
        }
        if (milliseconds <= 0) {
            addReplyErrorFormat(c,"invalid expire time in %s",c->cmd->name);
            return;
        }
        if (unit == UNIT_SECONDS) {
            milliseconds *= 1000;
        }
    }

    fetchInternalDbByKey(c,key);
    lockDbWrite(c->db);
    exist = (lookupKeyWrite(c->db,key,&expired) != NULL);

    /* NX refuses to touch an existing key, XX a missing one. */
    refused = ((flags & OBJ_SET_NX) && exist) ||
              ((flags & OBJ_SET_XX) && !exist);
    if (refused) {
        unlockDb(c->db);
        if (expired) update_stats_add(c->vel->stats, expiredkeys, 1);
        addReply(c, abort_reply ? abort_reply : shared.nullbulk);
        return;
    }

    setKey(c->db,key,dupStringObjectUnconstant(val),NULL);
    c->vel->dirty++;
    if (expire != NULL) {
        setExpire(c->db,key,vr_msec_now()+milliseconds);
    }
    notifyKeyspaceEvent(NOTIFY_STRING,"set",key,c->db->id);
    if (expire != NULL) {
        notifyKeyspaceEvent(NOTIFY_GENERIC,"expire",key,c->db->id);
    }
    addReply(c, ok_reply ? ok_reply : shared.ok);

    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* SET key value [NX] [XX] [EX <seconds>] [PX <milliseconds>] */
/* SET key value [NX] [XX] [EX <seconds>] [PX <milliseconds>]
 *
 * Parses the options (case insensitive) and hands over to
 * setGenericCommand(). NX and XX exclude each other, as do EX and PX; EX
 * and PX require a following argument. Any other option, or an option
 * violating those rules, yields a syntax error. */
void setCommand(client *c) {
    int j;
    robj *expire = NULL;
    int unit = UNIT_SECONDS;
    int flags = OBJ_SET_NO_FLAGS;

    for (j = 3; j < c->argc; j++) {
        char *a = c->argv[j]->ptr;
        robj *next = (j == c->argc-1) ? NULL : c->argv[j+1];
        int accepted = 0;

        /* Every option is exactly two characters long and ends in 'x'/'X';
         * the first character selects which one. */
        if (a[0] != '\0' && (a[1] == 'x' || a[1] == 'X') && a[2] == '\0') {
            switch (a[0]) {
            case 'n':
            case 'N':
                if (!(flags & OBJ_SET_XX)) {
                    flags |= OBJ_SET_NX;
                    accepted = 1;
                }
                break;
            case 'x':
            case 'X':
                if (!(flags & OBJ_SET_NX)) {
                    flags |= OBJ_SET_XX;
                    accepted = 1;
                }
                break;
            case 'e':
            case 'E':
                if (!(flags & OBJ_SET_PX) && next) {
                    flags |= OBJ_SET_EX;
                    unit = UNIT_SECONDS;
                    expire = next;
                    j++; /* the TTL argument has been consumed */
                    accepted = 1;
                }
                break;
            case 'p':
            case 'P':
                if (!(flags & OBJ_SET_EX) && next) {
                    flags |= OBJ_SET_PX;
                    unit = UNIT_MILLISECONDS;
                    expire = next;
                    j++; /* the TTL argument has been consumed */
                    accepted = 1;
                }
                break;
            default:
                break;
            }
        }

        if (!accepted) {
            addReply(c,shared.syntaxerr);
            return;
        }
    }

    c->argv[2] = tryObjectEncoding(c->argv[2]);
    setGenericCommand(c,flags,c->argv[1],c->argv[2],expire,unit,NULL,NULL);
}

/* SETNX key value: set only when the key does not exist. Replies with the
 * integer 1 on success and 0 when the key was left untouched. */
void setnxCommand(client *c) {
    robj *value = tryObjectEncoding(c->argv[2]);

    c->argv[2] = value;
    setGenericCommand(c,OBJ_SET_NX,c->argv[1],value,NULL,0,shared.cone,shared.czero);
}

/* SETEX key seconds value: unconditional set with a TTL in seconds
 * (argv[2]); the value is argv[3]. */
void setexCommand(client *c) {
    robj *value = tryObjectEncoding(c->argv[3]);

    c->argv[3] = value;
    setGenericCommand(c,OBJ_SET_NO_FLAGS,c->argv[1],value,c->argv[2],UNIT_SECONDS,NULL,NULL);
}

/* PSETEX key milliseconds value: unconditional set with a TTL in
 * milliseconds (argv[2]); the value is argv[3]. */
void psetexCommand(client *c) {
    robj *value = tryObjectEncoding(c->argv[3]);

    c->argv[3] = value;
    setGenericCommand(c,OBJ_SET_NO_FLAGS,c->argv[1],value,c->argv[2],UNIT_MILLISECONDS,NULL,NULL);
}

/* Reply with the string stored at argv[1].
 *
 * Returns VR_OK when the value was sent or the key is missing (a null bulk
 * has been replied in that case), VR_ERROR when the key holds a non-string
 * value (a wrong-type error has been replied). */
int getGenericCommand(client *c) {
    robj *val = lookupKeyReadOrReply(c,c->argv[1],shared.nullbulk);

    if (val == NULL) return VR_OK;

    if (val->type == OBJ_STRING) {
        addReplyBulk(c,val);
        return VR_OK;
    }

    addReply(c,shared.wrongtypeerr);
    return VR_ERROR;
}

/* GET key
 *
 * Looks the key up under a read lock on its database. A missing key gets a
 * null bulk reply and counts as a keyspace miss; an existing key counts as
 * a hit, whether its value is replied or a wrong-type error is sent. */
void getCommand(client *c) {
    robj *val;

    fetchInternalDbByKey(c,c->argv[1]);
    lockDbRead(c->db);

    val = lookupKeyReadOrReply(c,c->argv[1],shared.nullbulk);
    if (val == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }

    if (val->type == OBJ_STRING) {
        addReplyBulk(c,val);
    } else {
        addReply(c,shared.wrongtypeerr);
    }

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* GETSET key value
 *
 * Replaces the value at argv[1] with argv[2] and replies with the previous
 * value (null bulk when the key did not exist). Any TTL on an existing key
 * is removed. A key holding a non-string value is left untouched and a
 * wrong-type error is replied.
 *
 * Statistics: a missing key counts as a keyspace miss, an existing one
 * (even of the wrong type) as a hit. */
void getsetCommand(client *c) {
    robj *key, *val;
    int expired = 0;
    int exist;

    key = c->argv[1];
    c->argv[2] = tryObjectEncoding(c->argv[2]);

    fetchInternalDbByKey(c,key);
    lockDbWrite(c->db);
    val = lookupKeyWriteOrReply(c,key,shared.nullbulk,&expired);
    if (val == NULL) {
        exist = 0;
        dbAdd(c->db,key,dupStringObjectUnconstant(c->argv[2]));
    } else {
        exist = 1;
        if (val->type != OBJ_STRING) {
            addReply(c,shared.wrongtypeerr);
            goto end;
        }

        addReplyBulk(c,val);
        dbOverwrite(c->db,key,dupStringObjectUnconstant(c->argv[2]));
        removeExpire(c->db,key);
    }

    /* The key has been written through dbAdd()/dbOverwrite() directly, so
     * the modification has to be signalled explicitly, as
     * setrangeCommand() does for its own writes. */
    signalModifiedKey(c->db,key);
    notifyKeyspaceEvent(NOTIFY_STRING,"set",c->argv[1],c->db->id);
    c->vel->dirty++;

end:
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats, expiredkeys, 1);
    if (exist)
        update_stats_add(c->vel->stats, keyspace_hits, 1);
    else
        update_stats_add(c->vel->stats, keyspace_misses, 1);
}

/* SETRANGE key offset value
 *
 * Overwrites part of the string at argv[1], starting at 'offset', with
 * argv[3]; the string is zero-padded when it has to grow. Replies with the
 * resulting string length. An empty value changes nothing: the reply is
 * then the current length (0 for a missing key). Negative offsets and
 * results above the limit enforced by checkStringLength() are rejected. */
void setrangeCommand(client *c) {
    robj *target;
    long offset;
    sds value = c->argv[3]->ptr;
    size_t vlen;
    int expired = 0;

    if (getLongFromObjectOrReply(c,c->argv[2],&offset,NULL) != VR_OK) {
        return;
    }
    if (offset < 0) {
        addReplyError(c,"offset is out of range");
        return;
    }

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);
    target = lookupKeyWrite(c->db,c->argv[1],&expired);
    vlen = sdslen(value);

    if (target != NULL) {
        size_t olen;

        /* The key exists: it has to hold a string. */
        if (checkType(c,target,OBJ_STRING)) {
            unlockDb(c->db);
            if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
            return;
        }

        /* Nothing to write: report the current length. */
        olen = stringObjectLen(target);
        if (vlen == 0) {
            unlockDb(c->db);
            if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
            addReplyLongLong(c,olen);
            return;
        }

        /* Refuse results beyond the maximum string size. */
        if (checkStringLength(c,offset+vlen) != VR_OK) {
            unlockDb(c->db);
            if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
            return;
        }

        /* Get a private, raw-encoded value we are allowed to modify. */
        target = dbUnshareStringValue(c->db,c->argv[1],target);
    } else {
        /* Nothing to write on a missing key: the length is 0. */
        if (vlen == 0) {
            unlockDb(c->db);
            if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
            addReply(c,shared.czero);
            return;
        }

        /* Refuse results beyond the maximum string size. */
        if (checkStringLength(c,offset+vlen) != VR_OK) {
            unlockDb(c->db);
            if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
            return;
        }

        target = createObject(OBJ_STRING,sdsnewlen(NULL, offset+vlen));
        dbAdd(c->db,c->argv[1],target);
    }

    if (vlen > 0) {
        target->ptr = sdsgrowzero(target->ptr,offset+vlen);
        memcpy((char*)target->ptr+offset,value,vlen);
        signalModifiedKey(c->db,c->argv[1]);
        notifyKeyspaceEvent(NOTIFY_STRING,
            "setrange",c->argv[1],c->db->id);
        c->vel->dirty++;
    }
    addReplyLongLong(c,sdslen(target->ptr));
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* GETRANGE key start end
 *
 * Replies with the bytes of the string stored at key between the inclusive
 * offsets start and end. Negative offsets are counted from the end of the
 * string. An empty bulk is sent when the string is empty or the interval
 * selects nothing; the missing-key and wrong-type replies are delegated to
 * lookupKeyReadOrReply() and checkType().
 *
 * keyspace_misses is bumped when the key is missing, keyspace_hits in every
 * other case (including the wrong-type one). */
void getrangeCommand(client *c) {
    robj *o;
    long long start, end;
    char *str, llbuf[32];
    size_t strlen;
    int inverted;

    if (getLongLongFromObjectOrReply(c,c->argv[2],&start,NULL) != VR_OK)
        return;
    if (getLongLongFromObjectOrReply(c,c->argv[3],&end,NULL) != VR_OK)
        return;

    /* Two negative offsets with start > end always describe an empty
     * interval. This has to be recorded before the offsets are clamped:
     * once both are clamped to 0 the inversion is no longer visible and
     * the first byte would be returned by mistake. */
    inverted = (start < 0 && end < 0 && start > end);

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);
    if ((o = lookupKeyReadOrReply(c,c->argv[1],shared.emptybulk)) == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    } else if (checkType(c,o,OBJ_STRING)) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        return;
    }

    /* Integer encoded values are rendered into a local buffer so that they
     * can be sliced like any other string. */
    if (o->encoding == OBJ_ENCODING_INT) {
        str = llbuf;
        strlen = ll2string(llbuf,sizeof(llbuf),(long)o->ptr);
    } else {
        str = o->ptr;
        strlen = sdslen(str);
    }

    /* Convert negative indexes */
    if (start < 0) start = strlen+start;
    if (end < 0) end = strlen+end;
    if (start < 0) start = 0;
    if (end < 0) end = 0;
    if ((unsigned long long)end >= strlen) end = strlen-1;

    /* Precondition: end >= 0 && end < strlen, so besides the inverted
     * negative interval detected above, the only condition where nothing
     * can be returned is: start > end. */
    if (inverted || start > end || strlen == 0) {
        addReply(c,shared.emptybulk);
    } else {
        addReplyBulkCBuffer(c,(char*)str+start,end-start+1);
    }
    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* MGET key [key ...]
 *
 * Emits one bulk per requested key, in argument order. Every key is looked
 * up under its own read lock, after selecting the db with
 * fetchInternalDbByKey(). Missing keys and keys holding a non-string value
 * both produce a null bulk; only missing keys count as keyspace misses. */
void mgetCommand(client *c) {
    int idx = 1;

    addReplyMultiBulkLen(c,c->argc-1);
    while (idx < c->argc) {
        robj *key = c->argv[idx++];
        robj *val;

        fetchInternalDbByKey(c,key);
        lockDbRead(c->db);
        val = lookupKeyRead(c->db,key);
        if (val == NULL) {
            unlockDb(c->db);
            update_stats_add(c->vel->stats, keyspace_misses, 1);
            addReply(c,shared.nullbulk);
            continue;
        }

        /* The value is replied while the lock is still held. */
        if (val->type == OBJ_STRING) {
            addReplyBulk(c,val);
        } else {
            addReply(c,shared.nullbulk);
        }
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
    }
}

/* Shared implementation for multi-key set commands.
 *
 * c->argv holds key/value pairs starting at index 1. When nx is non-zero
 * nothing is written and :0 is replied if at least one of the keys already
 * exists; otherwise every pair is stored and the reply is :1 (nx) or +OK.
 *
 * NOTE(review): unlike msetCommand() in this file, this path does not call
 * fetchInternalDbByKey(), takes no db lock, stores the argument object
 * without dupStringObjectUnconstant() and accounts changes in server.dirty
 * rather than c->vel->dirty. Confirm whether that is intentional before
 * relying on this function. */
void msetGenericCommand(client *c, int nx) {
    int j;

    if (c->argc % 2 == 0) {
        addReplyError(c,"wrong number of arguments for MSET");
        return;
    }

    if (nx) {
        int busykeys = 0;

        /* Every key is probed, even after a busy one has been found. */
        for (j = 1; j < c->argc; j += 2)
            if (lookupKeyWrite(c->db,c->argv[j],NULL) != NULL) busykeys++;

        if (busykeys != 0) {
            addReply(c, shared.czero);
            return;
        }
    }

    j = 1;
    while (j < c->argc) {
        c->argv[j+1] = tryObjectEncoding(c->argv[j+1]);
        setKey(c->db,c->argv[j],c->argv[j+1],NULL);
        notifyKeyspaceEvent(NOTIFY_STRING,"set",c->argv[j],c->db->id);
        j += 2;
    }
    server.dirty += (c->argc-1)/2;

    if (nx)
        addReply(c, shared.cone);
    else
        addReply(c, shared.ok);
}

/* MSET key value [key value ...]
 *
 * Stores every pair, one key at a time: the db for the key is selected with
 * fetchInternalDbByKey() and write-locked only around the setKey() call.
 * A copy of the (possibly re-encoded) value is what gets stored. The number
 * of iterations after which the expired flag is set is added to the
 * expiredkeys statistic. Always replies +OK once the argument count has
 * been validated. */
void msetCommand(client *c) {
    int j;
    int expired = 0, expired_total = 0;

    if (c->argc % 2 == 0) {
        addReplyError(c,"wrong number of arguments for MSET");
        return;
    }

    j = 1;
    while (j < c->argc) {
        robj *key = c->argv[j];

        c->argv[j+1] = tryObjectEncoding(c->argv[j+1]);
        fetchInternalDbByKey(c,key);
        lockDbWrite(c->db);
        setKey(c->db,key,dupStringObjectUnconstant(c->argv[j+1]),&expired);
        unlockDb(c->db);
        /* The flag is deliberately not cleared between iterations. */
        expired_total += (expired != 0);
        notifyKeyspaceEvent(NOTIFY_STRING,"set",key,c->db->id);
        j += 2;
    }

    if (expired_total != 0)
        update_stats_add(c->vel->stats,expiredkeys,expired_total);
    c->vel->dirty += (c->argc-1)/2;
    addReply(c, shared.ok);
}

/* MSETNX: multi-key set that is refused when any of the keys exists. */
void msetnxCommand(client *c) {
    const int only_if_all_missing = 1;

    msetGenericCommand(c,only_if_all_missing);
}

/* Common implementation of INCR, DECR, INCRBY and DECRBY: adds incr to the
 * integer stored at c->argv[1] and replies with the new value as an integer
 * reply. A NULL lookup result is handed to getLongLongFromObjectOrReply()
 * as is. An error is replied, and nothing is modified, when the addition
 * would leave the long long range. */
void incrDecrCommand(client *c, long long incr) {
    long long value, oldvalue;
    robj *o, *result;
    int expired = 0;
    int overflows, in_place;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);
    o = lookupKeyWrite(c->db,c->argv[1],&expired);
    if (o != NULL && checkType(c,o,OBJ_STRING)) goto end;
    if (getLongLongFromObjectOrReply(c,o,&value,NULL) != VR_OK) goto end;

    /* Detect the overflow before performing the signed addition. */
    oldvalue = value;
    if (incr < 0) {
        overflows = (oldvalue < 0 && incr < (LLONG_MIN-oldvalue));
    } else if (incr > 0) {
        overflows = (oldvalue > 0 && incr > (LLONG_MAX-oldvalue));
    } else {
        overflows = 0;
    }
    if (overflows) {
        addReplyError(c,"increment or decrement would overflow");
        goto end;
    }
    value = oldvalue + incr;

    /* The stored object is patched in place only when it is an unshared
     * integer-encoded object and the new value is outside the shared
     * integers range while still fitting in a long. */
    in_place = (o && o->refcount == 1 && o->encoding == OBJ_ENCODING_INT &&
                (value < 0 || value >= OBJ_SHARED_INTEGERS) &&
                value >= LONG_MIN && value <= LONG_MAX);
    if (in_place) {
        o->ptr = (void*)((long)value);
        result = o;
    } else {
        result = createStringObjectFromLongLong(value);
        if (o == NULL) {
            dbAdd(c->db,c->argv[1],result);
        } else {
            dbOverwrite(c->db,c->argv[1],result);
        }
    }

    signalModifiedKey(c->db,c->argv[1]);
    notifyKeyspaceEvent(NOTIFY_STRING,"incrby",c->argv[1],c->db->id);
    c->vel->dirty++;
    addReply(c,shared.colon);
    addReply(c,result);
    addReply(c,shared.crlf);

end:
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats, expiredkeys, 1);
}

/* INCR key: add one to the integer stored at key. */
void incrCommand(client *c) {
    const long long step = 1;

    incrDecrCommand(c,step);
}

/* DECR key: subtract one from the integer stored at key. */
void decrCommand(client *c) {
    const long long step = -1;

    incrDecrCommand(c,step);
}

/* INCRBY key increment: parse the increment from c->argv[2] and apply it.
 * Nothing else is done when the argument cannot be parsed (the reply is
 * left to getLongLongFromObjectOrReply()). */
void incrbyCommand(client *c) {
    long long delta;

    if (getLongLongFromObjectOrReply(c, c->argv[2], &delta, NULL) == VR_OK)
        incrDecrCommand(c,delta);
}

/* DECRBY key decrement: parse the decrement from c->argv[2] and apply its
 * negation through incrDecrCommand(). Nothing else is done when the
 * argument cannot be parsed (the reply is left to
 * getLongLongFromObjectOrReply()). */
void decrbyCommand(client *c) {
    long long incr;

    if (getLongLongFromObjectOrReply(c, c->argv[2], &incr, NULL) != VR_OK) return;

    /* LLONG_MIN has no positive counterpart: negating it is a signed
     * overflow, which is undefined behavior in C. Refuse it explicitly. */
    if (incr == LLONG_MIN) {
        addReplyError(c,"decrement would overflow");
        return;
    }
    incrDecrCommand(c,-incr);
}

/* INCRBYFLOAT key increment
 *
 * Adds the floating point increment in c->argv[2] to the number stored at
 * c->argv[1] and replies with the new value as a bulk string. An error is
 * replied, and nothing is stored, when the sum is NaN or infinite. */
void incrbyfloatCommand(client *c) {
    long double incr, value;
    robj *o, *result, *aux;
    int expired = 0;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);
    o = lookupKeyWrite(c->db,c->argv[1],&expired);
    if (o != NULL && checkType(c,o,OBJ_STRING)) goto end;

    /* The current value is parsed first, then the increment. */
    if (getLongDoubleFromObjectOrReply(c,o,&value,NULL) != VR_OK) goto end;
    if (getLongDoubleFromObjectOrReply(c,c->argv[2],&incr,NULL) != VR_OK)
        goto end;

    value += incr;
    if (isnan(value) || isinf(value)) {
        addReplyError(c,"increment would produce NaN or Infinity");
        goto end;
    }

    result = createStringObjectFromLongDouble(value,1);
    if (o == NULL) {
        dbAdd(c->db,c->argv[1],result);
    } else {
        dbOverwrite(c->db,c->argv[1],result);
    }
    signalModifiedKey(c->db,c->argv[1]);
    notifyKeyspaceEvent(NOTIFY_STRING,"incrbyfloat",c->argv[1],c->db->id);
    c->vel->dirty++;
    addReplyBulk(c,result);

    /* The command is rewritten as a SET of the final value, so that
     * differences in float precision or formatting cannot create
     * differences in replicas or after an AOF restart. */
    aux = createStringObject("SET",3);
    rewriteClientCommandArgument(c,0,aux);
    aux = dupStringObjectUnconstant(result);
    rewriteClientCommandArgument(c,2,aux);

end:
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* APPEND key value
 *
 * Appends c->argv[2] to the string stored at c->argv[1], creating the key
 * with a copy of the argument when it does not exist. Replies with the
 * length of the string after the operation. */
void appendCommand(client *c) {
    size_t totlen;
    robj *o, *append;
    int expired = 0;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbWrite(c->db);
    o = lookupKeyWrite(c->db,c->argv[1],&expired);
    if (o != NULL) {
        /* Existing key: it must hold a string. */
        if (checkType(c,o,OBJ_STRING))
            goto end;

        /* The argument is always an sds string. The resulting length is
         * validated before the stored value is touched. */
        append = c->argv[2];
        totlen = stringObjectLen(o)+sdslen(append->ptr);
        if (checkStringLength(c,totlen) != VR_OK)
            goto end;

        /* Work on a private, raw-encoded copy of the value. */
        o = dbUnshareStringValue(c->db,c->argv[1],o);
        o->ptr = sdscatlen(o->ptr,append->ptr,sdslen(append->ptr));
        totlen = sdslen(o->ptr);
    } else {
        /* Missing key: store a copy of the argument. */
        c->argv[2] = tryObjectEncoding(c->argv[2]);
        dbAdd(c->db,c->argv[1],dupStringObjectUnconstant(c->argv[2]));
        totlen = stringObjectLen(c->argv[2]);
    }

    signalModifiedKey(c->db,c->argv[1]);
    notifyKeyspaceEvent(NOTIFY_STRING,"append",c->argv[1],c->db->id);
    c->vel->dirty++;
    addReplyLongLong(c,totlen);

end:
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* STRLEN key
 *
 * Replies with the length of the string stored at key. The reply for a
 * missing key (shared.czero) is sent by lookupKeyReadOrReply(); the
 * wrong-type case is left to checkType(). Only a missing key counts as a
 * keyspace miss. */
void strlenCommand(client *c) {
    robj *o;

    fetchInternalDbByKey(c, c->argv[1]);
    lockDbRead(c->db);
    o = lookupKeyReadOrReply(c,c->argv[1],shared.czero);
    if (o == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }

    /* When checkType() rejects the value no length is sent. */
    if (!checkType(c,o,OBJ_STRING))
        addReplyLongLong(c,stringObjectLen(o));

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}


================================================
FILE: src/vr_t_string.h
================================================
/* Prototypes of the command handlers operating on string values. */
#ifndef _VR_T_STRING_H_
#define _VR_T_STRING_H_

/* SET family and GET family. */
void setGenericCommand(client *c, int flags, robj *key, robj *val, robj *expire, int unit, robj *ok_reply, robj *abort_reply);
void setCommand(client *c);
void setnxCommand(client *c);
void setexCommand(client *c);
void psetexCommand(client *c);
int getGenericCommand(client *c);
void getCommand(client *c);
void getsetCommand(client *c);

/* Sub-string access. */
void setrangeCommand(client *c);
void getrangeCommand(client *c);

/* Multi-key variants. msetnxCommand() is a wrapper around
 * msetGenericCommand() with nx set. */
void mgetCommand(client *c);
void msetGenericCommand(client *c, int nx);
void msetCommand(client *c);
void msetnxCommand(client *c);

/* Counters. The integer commands all go through incrDecrCommand(). */
void incrDecrCommand(client *c, long long incr);
void incrCommand(client *c);
void decrCommand(client *c);
void incrbyCommand(client *c);
void decrbyCommand(client *c);
void incrbyfloatCommand(client *c);

/* Append and length. */
void appendCommand(client *c);
void strlenCommand(client *c);

#endif


================================================
FILE: src/vr_t_zset.c
================================================
#include <vr_core.h>

static int zslLexValueGteMin(robj *value, zlexrangespec *spec);
static int zslLexValueLteMax(robj *value, zlexrangespec *spec);

/* Allocate a skiplist node with room for 'level' levels and store score and
 * obj in it. The level entries and the backward pointer are left for the
 * caller to initialize. */
zskiplistNode *zslCreateNode(int level, double score, robj *obj) {
    zskiplistNode *node;

    node = dalloc(sizeof(*node)+level*sizeof(struct zskiplistLevel));
    node->obj = obj;
    node->score = score;
    return node;
}

zskiplist *zslCreate(void) {
    int j;
    zskiplist *zsl;

    zsl = dalloc(sizeof(*zsl));
    zsl->level = 1;
    zsl->length = 0;
    zsl->header = zslCreateNode(ZSKIPLIST_MAXLEVEL,0,NULL);
    for (j = 0; j < ZSKIPLIST_MAXLEVEL; j++) {
        zsl->header->level[j].forward = NULL;
        zsl->header->level[j].span = 0;
    }
    zsl->header->backward = NULL;
    zsl->tail = NULL;
    return zsl;
}

/* Release a single skiplist node. Only the node itself is freed: node->obj
 * is stored in the dict of the zset object and is not released here. */
void zslFreeNode(zskiplistNode *node) {
    dfree(node);
}

/* Release a whole skiplist: the header, every node reachable through the
 * level 0 links, and finally the list structure itself. */
void zslFree(zskiplist *zsl) {
    zskiplistNode *cur, *following;

    /* Grab the first real node before the header goes away. */
    cur = zsl->header->level[0].forward;
    dfree(zsl->header);

    for (; cur != NULL; cur = following) {
        following = cur->level[0].forward;
        zslFreeNode(cur);
    }
    dfree(zsl);
}

/* Pick the number of levels for a node that is about to be created.
 *
 * Starting from 1, the level keeps growing for as long as the low 16 bits
 * of random() stay below ZSKIPLIST_P * 0xFFFF, so higher levels are less
 * likely to be returned. The result is capped to ZSKIPLIST_MAXLEVEL and is
 * therefore always between 1 and ZSKIPLIST_MAXLEVEL, both inclusive. */
int zslRandomLevel(void) {
    int level;

    for (level = 1; (random()&0xFFFF) < (ZSKIPLIST_P * 0xFFFF); level++)
        ; /* every successful draw adds one level */

    if (level >= ZSKIPLIST_MAXLEVEL) return ZSKIPLIST_MAXLEVEL;
    return level;
}

/* Insert a new node holding (score, obj) into the skiplist and return it.
 *
 * Nodes are kept ordered by score and, for equal scores, by
 * compareStringObjects() on the element. The score must not be NaN.
 * The function does not check whether the element is already present. */
zskiplistNode *zslInsert(zskiplist *zsl, double score, robj *obj) {
    /* update[i] is the last node at level i that precedes the insertion
     * point; rank[i] is the number of level 0 steps from the header to
     * update[i]. */
    zskiplistNode *update[ZSKIPLIST_MAXLEVEL], *x;
    unsigned int rank[ZSKIPLIST_MAXLEVEL];
    int i, level;

    ASSERT(!isnan(score));
    x = zsl->header;
    for (i = zsl->level-1; i >= 0; i--) {
        /* store rank that is crossed to reach the insert position */
        rank[i] = i == (zsl->level-1) ? 0 : rank[i+1];
        while (x->level[i].forward &&
            (x->level[i].forward->score < score ||
                (x->level[i].forward->score == score &&
                compareStringObjects(x->level[i].forward->obj,obj) < 0))) {
            rank[i] += x->level[i].span;
            x = x->level[i].forward;
        }
        update[i] = x;
    }
    /* we assume the key is not already inside, since we allow duplicated
     * scores, and the re-insertion of score and redis object should never
     * happen since the caller of zslInsert() should test in the hash table
     * if the element is already inside or not. */
    level = zslRandomLevel();
    if (level > zsl->level) {
        /* The new node is taller than the list: the levels that were unused
         * so far start at the header, whose span at those levels is set to
         * the current length of the list. */
        for (i = zsl->level; i < level; i++) {
            rank[i] = 0;
            update[i] = zsl->header;
            update[i]->level[i].span = zsl->length;
        }
        zsl->level = level;
    }
    x = zslCreateNode(level,score,obj);
    for (i = 0; i < level; i++) {
        /* Splice x right after update[i] at this level. */
        x->level[i].forward = update[i]->level[i].forward;
        update[i]->level[i].forward = x;

        /* update span covered by update[i] as x is inserted here */
        x->level[i].span = update[i]->level[i].span - (rank[0] - rank[i]);
        update[i]->level[i].span = (rank[0] - rank[i]) + 1;
    }

    /* increment span for untouched levels */
    for (i = level; i < zsl->level; i++) {
        update[i]->level[i].span++;
    }

    /* Fix the level 0 backward links; the header is never exposed as a
     * backward pointer. A node without successor becomes the new tail. */
    x->backward = (update[0] == zsl->header) ? NULL : update[0];
    if (x->level[0].forward)
        x->level[0].forward->backward = x;
    else
        zsl->tail = x;
    zsl->length++;
    return x;
}

/* Unlink node x from the skiplist; the node itself is not freed.
 *
 * update[i] must be, for every level i in use, the last node preceding x
 * at that level. Used by zslDelete() and by the zslDeleteRangeBy*()
 * functions. */
void zslDeleteNode(zskiplist *zsl, zskiplistNode *x, zskiplistNode **update) {
    int lvl;

    for (lvl = 0; lvl < zsl->level; lvl++) {
        zskiplistNode *prev = update[lvl];

        if (prev->level[lvl].forward != x) {
            /* x is not linked at this level: the link merely jumps over
             * one element less. */
            prev->level[lvl].span -= 1;
            continue;
        }
        prev->level[lvl].span += x->level[lvl].span - 1;
        prev->level[lvl].forward = x->level[lvl].forward;
    }

    if (x->level[0].forward == NULL) {
        zsl->tail = x->backward;
    } else {
        x->level[0].forward->backward = x->backward;
    }

    /* Drop the top levels that no longer link to any node. */
    while (zsl->level > 1 && zsl->header->level[zsl->level-1].forward == NULL)
        zsl->level--;
    zsl->length--;
}

/* Remove from the skiplist the node matching both score and obj.
 * Returns 1 when a node was unlinked and freed, 0 when nothing matched. */
int zslDelete(zskiplist *zsl, double score, robj *obj) {
    zskiplistNode *update[ZSKIPLIST_MAXLEVEL];
    zskiplistNode *cur = zsl->header;
    zskiplistNode *victim;
    int lvl = zsl->level;

    while (lvl-- > 0) {
        for (;;) {
            zskiplistNode *nxt = cur->level[lvl].forward;

            if (nxt == NULL) break;
            if (!(nxt->score < score ||
                  (nxt->score == score &&
                   compareStringObjects(nxt->obj,obj) < 0))) break;
            cur = nxt;
        }
        update[lvl] = cur;
    }

    /* Several elements may share the score: the candidate must match the
     * object as well. */
    victim = cur->level[0].forward;
    if (victim == NULL) return 0;
    if (score != victim->score || !equalStringObjects(victim->obj,obj))
        return 0;

    zslDeleteNode(zsl, victim, update);
    zslFreeNode(victim);
    return 1;
}

/* Return non-zero when value satisfies the lower bound of spec, taking the
 * exclusive flag of the bound into account. */
static int zslValueGteMin(double value, zrangespec *spec) {
    if (spec->minex) return value > spec->min;
    return value >= spec->min;
}

/* Return non-zero when value satisfies the upper bound of spec, taking the
 * exclusive flag of the bound into account. */
int zslValueLteMax(double value, zrangespec *spec) {
    if (spec->maxex) return value < spec->max;
    return value <= spec->max;
}

/* Return 1 when some part of the skiplist may fall inside the score range,
 * 0 when the range is empty by construction, the list is empty, or every
 * element lies before the minimum or after the maximum. */
int zslIsInRange(zskiplist *zsl, zrangespec *range) {
    zskiplistNode *last, *first;

    /* Ranges that can never contain anything. */
    if (range->min > range->max) return 0;
    if (range->min == range->max && (range->minex || range->maxex))
        return 0;

    /* The greatest score must reach the minimum... */
    last = zsl->tail;
    if (last == NULL || !zslValueGteMin(last->score,range))
        return 0;

    /* ...and the smallest score must not exceed the maximum. */
    first = zsl->header->level[0].forward;
    if (first == NULL || !zslValueLteMax(first->score,range))
        return 0;

    return 1;
}

/* Return the first node whose score is inside the range, or NULL when no
 * element is contained in it. */
zskiplistNode *zslFirstInRange(zskiplist *zsl, zrangespec *range) {
    zskiplistNode *cur, *nxt;
    int lvl;

    /* Nothing to search when the whole list is out of range. */
    if (!zslIsInRange(zsl,range)) return NULL;

    /* Advance for as long as the next node is still below the minimum. */
    cur = zsl->header;
    for (lvl = zsl->level-1; lvl >= 0; lvl--) {
        while ((nxt = cur->level[lvl].forward) != NULL &&
               !zslValueGteMin(nxt->score,range))
            cur = nxt;
    }

    /* zslIsInRange() guarantees that a node reaching the minimum exists,
     * so the successor cannot be NULL. */
    cur = cur->level[0].forward;
    ASSERT(cur != NULL);

    /* The candidate must also respect the maximum. */
    return zslValueLteMax(cur->score,range) ? cur : NULL;
}

/* Return the last node whose score is inside the range, or NULL when no
 * element is contained in it. */
zskiplistNode *zslLastInRange(zskiplist *zsl, zrangespec *range) {
    zskiplistNode *cur, *nxt;
    int lvl;

    /* Nothing to search when the whole list is out of range. */
    if (!zslIsInRange(zsl,range)) return NULL;

    /* Advance for as long as the next node still respects the maximum. */
    cur = zsl->header;
    for (lvl = zsl->level-1; lvl >= 0; lvl--) {
        while ((nxt = cur->level[lvl].forward) != NULL &&
               zslValueLteMax(nxt->score,range))
            cur = nxt;
    }

    /* This is an inner range, so this node cannot be NULL. */
    ASSERT(cur != NULL);

    /* The candidate must also reach the minimum. */
    return zslValueGteMin(cur->score,range) ? cur : NULL;
}

/* Delete from the skiplist every element whose score is inside the range,
 * i.e. satisfies both the minimum and the maximum bound (each bound being
 * inclusive or exclusive according to range->minex / range->maxex).
 * The elements are removed from the given dict as well. Returns the number
 * of removed elements. */
unsigned long zslDeleteRangeByScore(zskiplist *zsl, zrangespec *range, dict *dict) {
    zskiplistNode *update[ZSKIPLIST_MAXLEVEL];
    zskiplistNode *cur = zsl->header;
    unsigned long removed = 0;
    int lvl;

    for (lvl = zsl->level-1; lvl >= 0; lvl--) {
        for (;;) {
            zskiplistNode *nxt = cur->level[lvl].forward;
            int before_range;

            if (nxt == NULL) break;
            before_range = range->minex ? (nxt->score <= range->min)
                                        : (nxt->score < range->min);
            if (!before_range) break;
            cur = nxt;
        }
        update[lvl] = cur;
    }

    /* cur is the last node before the range: start from its successor. */
    cur = cur->level[0].forward;

    while (cur != NULL) {
        zskiplistNode *following;
        int in_range = range->maxex ? (cur->score < range->max)
                                    : (cur->score <= range->max);

        if (!in_range) break;
        following = cur->level[0].forward;
        zslDeleteNode(zsl,cur,update);
        dictDelete(dict,cur->obj);
        zslFreeNode(cur);
        removed++;
        cur = following;
    }
    return removed;
}

/* Delete from the skiplist every element that is inside the lexicographic
 * range, removing it from the given dict as well. Returns the number of
 * removed elements. */
unsigned long zslDeleteRangeByLex(zskiplist *zsl, zlexrangespec *range, dict *dict) {
    zskiplistNode *update[ZSKIPLIST_MAXLEVEL];
    zskiplistNode *cur = zsl->header;
    zskiplistNode *nxt;
    unsigned long removed = 0;
    int lvl;

    for (lvl = zsl->level-1; lvl >= 0; lvl--) {
        while ((nxt = cur->level[lvl].forward) != NULL &&
               !zslLexValueGteMin(nxt->obj,range))
            cur = nxt;
        update[lvl] = cur;
    }

    /* cur is the last node before the range: start from its successor. */
    cur = cur->level[0].forward;

    /* Delete for as long as the elements respect the maximum. */
    for (; cur != NULL && zslLexValueLteMax(cur->obj,range); cur = nxt) {
        nxt = cur->level[0].forward;
        zslDeleteNode(zsl,cur,update);
        dictDelete(dict,cur->obj);
        zslFreeNode(cur);
        removed++;
    }
    return removed;
}

/* Delete from the skiplist the elements whose rank is between start and
 * end, both inclusive and both 1-based, removing them from the given dict
 * as well. Returns the number of removed elements. */
unsigned long zslDeleteRangeByRank(zskiplist *zsl, unsigned int start, unsigned int end, dict *dict) {
    zskiplistNode *update[ZSKIPLIST_MAXLEVEL];
    zskiplistNode *cur = zsl->header;
    unsigned long traversed = 0, removed = 0;
    int lvl;

    /* Stop right before the node of rank 'start'. */
    for (lvl = zsl->level-1; lvl >= 0; lvl--) {
        while (cur->level[lvl].forward &&
               (traversed + cur->level[lvl].span) < start) {
            traversed += cur->level[lvl].span;
            cur = cur->level[lvl].forward;
        }
        update[lvl] = cur;
    }

    /* From here on 'traversed' is the rank of cur. */
    cur = cur->level[0].forward;
    for (traversed++; cur != NULL && traversed <= end; traversed++) {
        zskiplistNode *following = cur->level[0].forward;

        zslDeleteNode(zsl,cur,update);
        dictDelete(dict,cur->obj);
        zslFreeNode(cur);
        removed++;
        cur = following;
    }
    return removed;
}

/* Return the rank of the element identified by score and object, or 0 when
 * it cannot be found. Ranks are 1-based, because the span of the header
 * towards the first element is counted too. */
unsigned long zslGetRank(zskiplist *zsl, double score, robj *o) {
    zskiplistNode *cur = zsl->header;
    unsigned long crossed = 0;
    int lvl = zsl->level;

    while (lvl-- > 0) {
        for (;;) {
            zskiplistNode *nxt = cur->level[lvl].forward;

            if (nxt == NULL) break;
            if (!(nxt->score < score ||
                  (nxt->score == score &&
                   compareStringObjects(nxt->obj,o) <= 0))) break;
            crossed += cur->level[lvl].span;
            cur = nxt;
        }

        /* cur may still be the header, whose obj is NULL. */
        if (cur->obj && equalStringObjects(cur->obj,o))
            return crossed;
    }
    return 0;
}

/* Return the node found after crossing exactly 'rank' elements from the
 * header, or NULL when no such node exists. The rank is 1-based. */
zskiplistNode* zslGetElementByRank(zskiplist *zsl, unsigned long rank) {
    zskiplistNode *cur = zsl->header;
    unsigned long crossed = 0;
    int lvl = zsl->level;

    while (lvl-- > 0) {
        /* Follow this level without stepping over the wanted rank. */
        while (cur->level[lvl].forward &&
               (crossed + cur->level[lvl].span) <= rank) {
            crossed += cur->level[lvl].span;
            cur = cur->level[lvl].forward;
        }
        if (crossed == rank) return cur;
    }
    return NULL;
}

/* Fill spec from the min and max objects of a score range.
 *
 * A bound prefixed by "(" is open (exclusive), otherwise it is closed:
 *   ZRANGEBYSCORE zset (1.5 (2.5   matches min < x < max
 *   ZRANGEBYSCORE zset 1.5 2.5     matches min <= x <= max
 * Integer encoded objects are used as they are. Returns VR_OK on success,
 * VR_ERROR when a bound is not entirely a number or is NaN. */
static int zslParseRange(robj *min, robj *max, zrangespec *spec) {
    char *eptr;
    char *text;
    int open;

    spec->minex = spec->maxex = 0;

    /* Lower bound. */
    if (min->encoding == OBJ_ENCODING_INT) {
        spec->min = (long)min->ptr;
    } else {
        text = min->ptr;
        open = (text[0] == '(');
        spec->min = strtod(open ? text+1 : text,&eptr);
        if (eptr[0] != '\0' || isnan(spec->min)) return VR_ERROR;
        if (open) spec->minex = 1;
    }

    /* Upper bound. */
    if (max->encoding == OBJ_ENCODING_INT) {
        spec->max = (long)max->ptr;
    } else {
        text = max->ptr;
        open = (text[0] == '(');
        spec->max = strtod(open ? text+1 : text,&eptr);
        if (eptr[0] != '\0' || isnan(spec->max)) return VR_ERROR;
        if (open) spec->maxex = 1;
    }

    return VR_OK;
}

/* ------------------------ Lexicographic ranges ---------------------------- */

/* Release one bound of a lex range. The shared.minstring and
 * shared.maxstring sentinels are not owned by the range and are never
 * freed; NULL is ignored. */
static void zslReleaseLexRangeItem(robj *item) {
    if (item == NULL) return;
    if (item == shared.minstring || item == shared.maxstring) return;
    freeObject(item);
}

/* Parse the max or min argument of ZRANGEBYLEX.
 *
 *   (foo  means foo, open interval (the bound itself is excluded)
 *   [foo  means foo, closed interval (the bound itself is included)
 *   -     means the smallest possible string
 *   +     means the greatest possible string
 *
 * On success VR_OK is returned, *ex is set to 1 when the bound is exclusive
 * and to 0 when it is inclusive, and *dest is set to the object to use for
 * the comparisons: a newly created string for "(" and "[", or the
 * shared.minstring / shared.maxstring sentinel itself for "-" and "+".
 *
 * The sentinels are stored by reference on purpose:
 * compareStringObjectsForLexRange() recognizes the infinite bounds by
 * pointer identity, so a copy of a sentinel would be compared as an
 * ordinary string. For the same reason a bound must be released with
 * zslFreeLexRange(), which leaves the sentinels alone.
 *
 * If the string is not a valid range item VR_ERROR is returned, and *dest
 * and *ex must not be relied upon. */
int zslParseLexRangeItem(robj *item, robj **dest, int *ex) {
    char *c = item->ptr;

    switch(c[0]) {
    case '+':
        if (c[1] != '\0') return VR_ERROR;
        *ex = 0;
        *dest = shared.maxstring;
        return VR_OK;
    case '-':
        if (c[1] != '\0') return VR_ERROR;
        *ex = 0;
        *dest = shared.minstring;
        return VR_OK;
    case '(':
        *ex = 1;
        *dest = createStringObject(c+1,sdslen(c)-1);
        return VR_OK;
    case '[':
        *ex = 0;
        *dest = createStringObject(c+1,sdslen(c)-1);
        return VR_OK;
    default:
        return VR_ERROR;
    }
}

/* Populate the rangespec according to the objects min and max.
 *
 * Return VR_OK on success. On error VR_ERROR is returned.
 * When VR_OK is returned the structure must be freed with zslFreeLexRange(),
 * otherwise no release is needed. */
static int zslParseLexRange(robj *min, robj *max, zlexrangespec *spec) {
    /* The range can't be valid if objects are integer encoded.
     * Every item must start with ( or [. */
    if (min->encoding == OBJ_ENCODING_INT ||
        max->encoding == OBJ_ENCODING_INT) return VR_ERROR;

    spec->min = spec->max = NULL;
    if (zslParseLexRangeItem(min, &spec->min, &spec->minex) == VR_ERROR ||
        zslParseLexRangeItem(max, &spec->max, &spec->maxex) == VR_ERROR) {
        /* Undo whatever was parsed before the failure. */
        zslReleaseLexRangeItem(spec->min);
        zslReleaseLexRangeItem(spec->max);
        return VR_ERROR;
    } else {
        return VR_OK;
    }
}

/* Free a lex range structure, must be called only after zslParseLexRange()
 * populated the structure with success (VR_OK returned). Bounds that are
 * the shared infinity sentinels are left untouched. */
void zslFreeLexRange(zlexrangespec *spec) {
    zslReleaseLexRangeItem(spec->min);
    zslReleaseLexRangeItem(spec->max);
}

/* compareStringObjects() wrapper for lexicographic ranges.
 *
 * shared.minstring and shared.maxstring are treated, by pointer identity,
 * as the string equivalents of -inf and +inf. Returns 0 when a and b are
 * the same object, -1 / 1 when an infinity decides the order, and the
 * result of compareStringObjects() otherwise. */
int compareStringObjectsForLexRange(robj *a, robj *b) {
    /* Same object: covers inf,inf and -inf,-inf right away. */
    if (a == b) return 0;

    if (a == shared.minstring) return -1;
    if (b == shared.maxstring) return -1;
    if (a == shared.maxstring) return 1;
    if (b == shared.minstring) return 1;

    return compareStringObjects(a,b);
}

/* Return non-zero when value satisfies the lower bound of the lex range,
 * taking the exclusive flag of the bound into account. */
static int zslLexValueGteMin(robj *value, zlexrangespec *spec) {
    int cmp = compareStringObjectsForLexRange(value,spec->min);

    if (spec->minex) return cmp > 0;
    return cmp >= 0;
}

/* Return non-zero when value satisfies the upper bound of the lex range,
 * taking the exclusive flag of the bound into account. */
static int zslLexValueLteMax(robj *value, zlexrangespec *spec) {
    int cmp = compareStringObjectsForLexRange(value,spec->max);

    if (spec->maxex) return cmp < 0;
    return cmp <= 0;
}

/* Return 1 when some part of the skiplist may fall inside the lex range,
 * 0 when the range is empty by construction, the list is empty, or every
 * element lies before the minimum or after the maximum. */
int zslIsInLexRange(zskiplist *zsl, zlexrangespec *range) {
    zskiplistNode *x;
    int cmp;

    /* Test for ranges that will always be empty: min after max, or equal
     * bounds with at least one of them exclusive. The bounds are compared
     * once, with the range-aware comparison, so that any positive result
     * counts as "min after max" and the infinity sentinels are never
     * mistaken for ordinary strings. */
    cmp = compareStringObjectsForLexRange(range->min,range->max);
    if (cmp > 0 || (cmp == 0 && (range->minex || range->maxex)))
        return 0;

    /* The greatest element must reach the minimum... */
    x = zsl->tail;
    if (x == NULL || !zslLexValueGteMin(x->obj,range))
        return 0;

    /* ...and the smallest element must not exceed the maximum. */
    x = zsl->header->level[0].forward;
    if (x == NULL || !zslLexValueLteMax(x->obj,range))
        return 0;
    return 1;
}

/* Return the first node whose element is inside the lex range, or NULL
 * when no element is contained in it. */
zskiplistNode *zslFirstInLexRange(zskiplist *zsl, zlexrangespec *range) {
    zskiplistNode *cur, *nxt;
    int lvl;

    /* Nothing to search when the whole list is out of range. */
    if (!zslIsInLexRange(zsl,range)) return NULL;

    /* Advance for as long as the next element is still below the minimum. */
    cur = zsl->header;
    for (lvl = zsl->level-1; lvl >= 0; lvl--) {
        while ((nxt = cur->level[lvl].forward) != NULL &&
               !zslLexValueGteMin(nxt->obj,range))
            cur = nxt;
    }

    /* zslIsInLexRange() guarantees that an element reaching the minimum
     * exists, so the successor cannot be NULL. */
    cur = cur->level[0].forward;
    ASSERT(cur != NULL);

    /* The candidate must also respect the maximum. */
    return zslLexValueLteMax(cur->obj,range) ? cur : NULL;
}

/* Return the last node whose element is inside the lex range, or NULL when
 * no element is contained in it. */
zskiplistNode *zslLastInLexRange(zskiplist *zsl, zlexrangespec *range) {
    zskiplistNode *cur, *nxt;
    int lvl;

    /* Nothing to search when the whole list is out of range. */
    if (!zslIsInLexRange(zsl,range)) return NULL;

    /* Advance for as long as the next element still respects the maximum. */
    cur = zsl->header;
    for (lvl = zsl->level-1; lvl >= 0; lvl--) {
        while ((nxt = cur->level[lvl].forward) != NULL &&
               zslLexValueLteMax(nxt->obj,range))
            cur = nxt;
    }

    /* This is an inner range, so this node cannot be NULL. */
    ASSERT(cur != NULL);

    /* The candidate must also reach the minimum. */
    return zslLexValueGteMin(cur->obj,range) ? cur : NULL;
}

/*-----------------------------------------------------------------------------
 * Ziplist-backed sorted set API
 *----------------------------------------------------------------------------*/

/* Decode the score stored in the ziplist entry pointed to by sptr.
 * An entry holding a string is parsed with strtod(); an entry holding an
 * integer is converted directly. */
double zzlGetScore(unsigned char *sptr) {
    unsigned char *vstr;
    unsigned int vlen;
    long long vlong;
    char buf[128];
    int ret;

    ASSERT(sptr != NULL);

    ret = (int)ziplistGet(sptr,&vstr,&vlen,&vlong);
    ASSERT(ret > 0);

    if (vstr == NULL) return vlong;

    /* strtod() needs a terminated string, so the bytes are copied first.
     * NOTE(review): this assumes vlen < sizeof(buf) - confirm that score
     * entries are always short enough. */
    memcpy(buf,vstr,vlen);
    buf[vlen] = '\0';
    return strtod(buf,NULL);
}

/* Build a new string object from the ziplist entry pointed to by sptr.
 * A convenience that simplifies some code at the cost of some
 * performance. */
robj *ziplistGetObject(unsigned char *sptr) {
    unsigned char *vstr;
    unsigned int vlen;
    long long vlong;
    int ret;

    ASSERT(sptr != NULL);

    ret = (int)ziplistGet(sptr,&vstr,&vlen,&vlong);
    ASSERT(ret > 0);

    /* The entry holds either a string or an integer. */
    if (vstr == NULL)
        return createStringObjectFromLongLong(vlong);
    return createStringObject((char*)vstr,vlen);
}

/* Compare the ziplist entry at eptr with the buffer cstr of clen bytes.
 * The common prefix is compared with memcmp(); when it is identical the
 * difference between the two lengths is returned. Integer entries are
 * compared through their decimal representation. */
int zzlCompareElements(unsigned char *eptr, unsigned char *cstr, unsigned int clen) {
    unsigned char *vstr;
    unsigned int vlen;
    long long vlong;
    unsigned char vbuf[32];
    int ret, minlen, cmp;

    ret = (int)ziplistGet(eptr,&vstr,&vlen,&vlong);
    ASSERT(ret > 0);

    if (vstr == NULL) {
        /* Integer entry: render it as a string in the local buffer. */
        vlen = ll2string((char*)vbuf,sizeof(vbuf),vlong);
        vstr = vbuf;
    }

    minlen = clen;
    if (vlen < clen) minlen = vlen;

    cmp = memcmp(vstr,cstr,minlen);
    if (cmp != 0) return cmp;
    return vlen-clen;
}

/* Number of elements of a ziplist-backed sorted set: half the number of
 * ziplist entries. */
unsigned int zzlLength(unsigned char *zl) {
    unsigned int entries = ziplistLen(zl);

    return entries/2;
}

/* Advance *eptr / *sptr to the element and score entries that follow the
 * current pair. Both are set to NULL when there is no next entry. */
void zzlNext(unsigned char *zl, unsigned char **eptr, unsigned char **sptr) {
    unsigned char *next_elem, *next_score = NULL;

    ASSERT(*eptr != NULL && *sptr != NULL);

    /* The next element comes right after the current score. */
    next_elem = ziplistNext(zl,*sptr);
    if (next_elem != NULL) {
        next_score = ziplistNext(zl,next_elem);
        ASSERT(next_score != NULL);
    }

    *eptr = next_elem;
    *sptr = next_score;
}

/* Move *eptr / *sptr back to the element and score entries that precede
 * the current pair. Both are set to NULL when there is no previous
 * entry. */
void zzlPrev(unsigned char *zl, unsigned char **eptr, unsigned char **sptr) {
    unsigned char *prev_elem = NULL, *prev_score;

    ASSERT(*eptr != NULL && *sptr != NULL);

    /* The previous score comes right before the current element. */
    prev_score = ziplistPrev(zl,*eptr);
    if (prev_score != NULL) {
        prev_elem = ziplistPrev(zl,prev_score);
        ASSERT(prev_elem != NULL);
    }

    *eptr = prev_elem;
    *sptr = prev_score;
}

/* Return 1 when some part of the ziplist-backed sorted set may fall inside
 * the score range, 0 otherwise. Should only be used internally by
 * zzlFirstInRange and zzlLastInRange. */
int zzlIsInRange(unsigned char *zl, zrangespec *range) {
    unsigned char *entry;

    /* Ranges that can never contain anything. */
    if (range->min > range->max) return 0;
    if (range->min == range->max && (range->minex || range->maxex))
        return 0;

    /* The last entry is the last score: it must reach the minimum. */
    entry = ziplistIndex(zl,-1);
    if (entry == NULL) return 0; /* Empty sorted set */
    if (!zslValueGteMin(zzlGetScore(entry),range))
        return 0;

    /* The entry at index 1 is the first score: it must not exceed the
     * maximum. */
    entry = ziplistIndex(zl,1);
    ASSERT(entry != NULL);
    if (!zslValueLteMax(zzlGetScore(entry),range))
        return 0;

    return 1;
}

/* Return a pointer to the first member whose score lies inside 'range', or
 * NULL when no element of the ziplist is contained in the range. */
unsigned char *zzlFirstInRange(unsigned char *zl, zrangespec *range) {
    unsigned char *member, *scoreptr;
    double value;

    /* Nothing to scan when the whole set is outside the range. */
    if (!zzlIsInRange(zl,range)) return NULL;

    for (member = ziplistIndex(zl,0); member != NULL;
         member = ziplistNext(zl,scoreptr))
    {
        scoreptr = ziplistNext(zl,member);
        ASSERT(scoreptr != NULL);

        value = zzlGetScore(scoreptr);
        if (!zslValueGteMin(value,range)) continue;

        /* First score that reaches min: it is the answer only if it also
         * stays within max. */
        return zslValueLteMax(value,range) ? member : NULL;
    }

    return NULL;
}

/* Return a pointer to the last member whose score lies inside 'range', or
 * NULL when no element of the ziplist is contained in the range. */
unsigned char *zzlLastInRange(unsigned char *zl, zrangespec *range) {
    unsigned char *member, *scoreptr;
    double value;

    /* Nothing to scan when the whole set is outside the range. */
    if (!zzlIsInRange(zl,range)) return NULL;

    /* Start from the last member (second entry from the tail). */
    member = ziplistIndex(zl,-2);
    while (member != NULL) {
        scoreptr = ziplistNext(zl,member);
        ASSERT(scoreptr != NULL);

        value = zzlGetScore(scoreptr);
        if (zslValueLteMax(value,range)) {
            /* Last score within max: valid only if it also reaches min. */
            return zslValueGteMin(value,range) ? member : NULL;
        }

        /* Step back over the previous score; when there is none there is
         * no previous member either. */
        scoreptr = ziplistPrev(zl,member);
        if (scoreptr == NULL) break;
        member = ziplistPrev(zl,scoreptr);
        ASSERT(member != NULL);
    }

    return NULL;
}

/* Evaluate zslLexValueGteMin() for the ziplist entry 'p'. The entry is turned
 * into a temporary object for the check and released before returning. */
static int zzlLexValueGteMin(unsigned char *p, zlexrangespec *spec) {
    robj *member;
    int inrange;

    member = ziplistGetObject(p);
    inrange = zslLexValueGteMin(member,spec);
    freeObject(member);

    return inrange;
}

/* Evaluate zslLexValueLteMax() for the ziplist entry 'p'. The entry is turned
 * into a temporary object for the check and released before returning. */
static int zzlLexValueLteMax(unsigned char *p, zlexrangespec *spec) {
    robj *member;
    int inrange;

    member = ziplistGetObject(p);
    inrange = zslLexValueLteMax(member,spec);
    freeObject(member);

    return inrange;
}

/* Return 1 when some part of the ziplist-encoded sorted set may fall inside
 * the lexicographic range 'range', 0 when that is impossible. Should only be
 * used internally by zzlFirstInLexRange and zzlLastInLexRange. */
int zzlIsInLexRange(unsigned char *zl, zlexrangespec *range) {
    unsigned char *p;
    int cmp;

    /* Test for ranges that will always be empty: min after max, or min equal
     * to max with at least one exclusive bound.
     *
     * The comparison result is only meaningful by sign, so it is tested
     * against 0 (testing "> 1" would miss inverted ranges whenever the
     * comparator returns exactly 1). The same lex-aware comparison is used
     * for both the ordering and the equality test so the two agree. */
    cmp = compareStringObjectsForLexRange(range->min,range->max);
    if (cmp > 0 || (cmp == 0 && (range->minex || range->maxex)))
        return 0;

    p = ziplistIndex(zl,-2); /* Last element. */
    if (p == NULL) return 0; /* Empty sorted set. */
    if (!zzlLexValueGteMin(p,range))
        return 0;

    p = ziplistIndex(zl,0); /* First element. */
    ASSERT(p != NULL);
    if (!zzlLexValueLteMax(p,range))
        return 0;

    return 1;
}

/* Return a pointer to the first member contained in the lexicographic range
 * 'range', or NULL when no element of the ziplist is contained in it. */
unsigned char *zzlFirstInLexRange(unsigned char *zl, zlexrangespec *range) {
    unsigned char *member, *scoreptr;

    /* Nothing to scan when the whole set is outside the range. */
    if (!zzlIsInLexRange(zl,range)) return NULL;

    member = ziplistIndex(zl,0);
    while (member != NULL) {
        if (zzlLexValueGteMin(member,range)) {
            /* First member that reaches min: valid only if it also stays
             * within max. */
            return zzlLexValueLteMax(member,range) ? member : NULL;
        }

        /* Skip this member's score to land on the next member. */
        scoreptr = ziplistNext(zl,member);
        ASSERT(scoreptr != NULL);
        member = ziplistNext(zl,scoreptr);
    }

    return NULL;
}

/* Return a pointer to the last member contained in the lexicographic range
 * 'range', or NULL when no element of the ziplist is contained in it. */
unsigned char *zzlLastInLexRange(unsigned char *zl, zlexrangespec *range) {
    unsigned char *member, *scoreptr;

    /* Nothing to scan when the whole set is outside the range. */
    if (!zzlIsInLexRange(zl,range)) return NULL;

    /* Start from the last member (second entry from the tail). */
    member = ziplistIndex(zl,-2);
    while (member != NULL) {
        if (zzlLexValueLteMax(member,range)) {
            /* Last member within max: valid only if it also reaches min. */
            return zzlLexValueGteMin(member,range) ? member : NULL;
        }

        /* Step back over the previous score; when there is none there is
         * no previous member either. */
        scoreptr = ziplistPrev(zl,member);
        if (scoreptr == NULL) break;
        member = ziplistPrev(zl,scoreptr);
        ASSERT(member != NULL);
    }

    return NULL;
}

/* Look up 'ele' in the ziplist 'zl'.
 *
 * Returns a pointer to the matching member entry, or NULL when the member is
 * not present. On a match, and when 'score' is not NULL, the member's score
 * is stored into *score. The decoded copy of 'ele' obtained for the search is
 * released before returning when it is a different object than 'ele'. */
unsigned char *zzlFind(unsigned char *zl, robj *ele, double *score) {
    unsigned char *cur, *curscore, *found = NULL;
    robj *plain = getDecodedObject(ele);

    for (cur = ziplistIndex(zl,0); cur != NULL;
         cur = ziplistNext(zl,curscore))
    {
        curscore = ziplistNext(zl,cur);
        serverAssertWithInfo(NULL,plain,curscore != NULL);

        if (!ziplistCompare(cur,plain->ptr,sdslen(plain->ptr)))
            continue;

        /* Matching member: report its score when requested and stop. */
        if (score != NULL) *score = zzlGetScore(curscore);
        found = cur;
        break;
    }

    if (plain != ele) freeObject(plain);
    return found;
}

/* Remove the (member,score) pair whose member entry is 'eptr' and return the
 * possibly relocated ziplist. A private cursor is used so the caller's
 * pointer value is left untouched. */
unsigned char *zzlDelete(unsigned char *zl, unsigned char *eptr) {
    unsigned char *cursor = eptr;
    int i;

    /* TODO: add function to ziplist API to delete N elements from offset. */
    /* Two deletions at the same cursor: first the member, then the score. */
    for (i = 0; i < 2; i++)
        zl = ziplistDelete(zl,&cursor);

    return zl;
}

/* Insert the pair (ele,score) into the ziplist 'zl'.
 *
 * When 'eptr' is NULL the pair is appended at the tail; otherwise the member
 * is inserted at 'eptr' and the score right after it. 'ele' must be an
 * sds-encoded string object (asserted). The score is stored in the textual
 * form produced by d2string().
 *
 * Returns the ziplist pointer, which may differ from the one passed in. */
unsigned char *zzlInsertAt(unsigned char *zl, unsigned char *eptr, robj *ele, double score) {
    unsigned char *sptr;
    char scorebuf[128];
    int scorelen;
    size_t offset;

    serverAssertWithInfo(NULL,ele,sdsEncodedObject(ele));
    scorelen = d2string(scorebuf,sizeof(scorebuf),score);
    if (eptr == NULL) {
        zl = ziplistPush(zl,ele->ptr,sdslen(ele->ptr),ZIPLIST_TAIL);
        zl = ziplistPush(zl,(unsigned char*)scorebuf,scorelen,ZIPLIST_TAIL);
    } else {
        /* Keep offset relative to zl, as it might be re-allocated. */
        offset = eptr-zl;
        zl = ziplistInsert(zl,eptr,ele->ptr,sdslen(ele->ptr));
        eptr = zl+offset;

        /* Insert score after the element. The lookup is done outside of the
         * assertion so that 'sptr' is always assigned, even if the assertion
         * macro were ever compiled out. */
        sptr = ziplistNext(zl,eptr);
        serverAssertWithInfo(NULL,ele,sptr != NULL);
        zl = ziplistInsert(zl,sptr,(unsigned char*)scorebuf,scorelen);
    }

    return zl;
}

/* Insert the pair (ele,score) into the ziplist at the position that keeps it
 * ordered by score and, for equal scores, by member. The member is assumed
 * not to be present yet. Returns the possibly relocated ziplist. */
unsigned char *zzlInsert(unsigned char *zl, robj *ele, double score) {
    unsigned char *pos, *sptr;
    double cur;
    robj *plain = getDecodedObject(ele);

    /* Look for the first pair that has to come after the new one. 'pos' is
     * left NULL when every existing pair sorts before it. */
    for (pos = ziplistIndex(zl,0); pos != NULL; pos = ziplistNext(zl,sptr)) {
        sptr = ziplistNext(zl,pos);
        serverAssertWithInfo(NULL,plain,sptr != NULL);
        cur = zzlGetScore(sptr);

        /* Larger score: the new pair takes this spot. */
        if (cur > score) break;

        /* Same score: order by member. */
        if (cur == score &&
            zzlCompareElements(pos,plain->ptr,sdslen(plain->ptr)) > 0)
            break;
    }

    /* A NULL position makes zzlInsertAt push on the tail of the list. */
    zl = zzlInsertAt(zl,pos,plain,score);

    if (plain != ele) freeObject(plain);
    return zl;
}

/* Delete every pair whose score lies inside 'range'. The number of removed
 * pairs is stored into *deleted when 'deleted' is not NULL. Returns the
 * possibly relocated ziplist. */
unsigned char *zzlDeleteRangeByScore(unsigned char *zl, zrangespec *range, unsigned long *deleted) {
    unsigned char *cur, *scoreptr;
    double value;
    unsigned long removed = 0;

    cur = zzlFirstInRange(zl,range);
    if (cur != NULL) {
        /* When the tail of the ziplist is deleted, 'cur' will point to the
         * sentinel byte and ziplistNext will return NULL. */
        while ((scoreptr = ziplistNext(zl,cur)) != NULL) {
            value = zzlGetScore(scoreptr);

            /* Stop at the first score beyond max. */
            if (!zslValueLteMax(value,range)) break;

            /* Delete both the element and the score. */
            zl = ziplistDelete(zl,&cur);
            zl = ziplistDelete(zl,&cur);
            removed++;
        }
    }

    if (deleted != NULL) *deleted = removed;
    return zl;
}

/* Delete every pair whose member lies inside the lexicographic 'range'. The
 * number of removed pairs is stored into *deleted when 'deleted' is not NULL.
 * Returns the possibly relocated ziplist. */
unsigned char *zzlDeleteRangeByLex(unsigned char *zl, zlexrangespec *range, unsigned long *deleted) {
    unsigned char *cur;
    unsigned long removed = 0;

    cur = zzlFirstInLexRange(zl,range);
    if (cur != NULL) {
        /* When the tail of the ziplist is deleted, 'cur' will point to the
         * sentinel byte and ziplistNext will return NULL. The loop also
         * stops at the first member beyond max. */
        while (ziplistNext(zl,cur) != NULL && zzlLexValueLteMax(cur,range)) {
            /* Delete both the element and the score. */
            zl = ziplistDelete(zl,&cur);
            zl = ziplistDelete(zl,&cur);
            removed++;
        }
    }

    if (deleted != NULL) *deleted = removed;
    return zl;
}

/* Delete all the elements with rank between start and end from the ziplist.
 * Start and end are inclusive and 1-based. The number of elements covered by
 * the rank interval is stored into *deleted when 'deleted' is not NULL. */
unsigned char *zzlDeleteRangeByRank(unsigned char *zl, unsigned int start, unsigned int end, unsigned long *deleted) {
    unsigned int count = (end-start)+1;

    if (deleted != NULL) *deleted = count;

    /* Each element spans two ziplist entries, hence the doubled index and
     * entry count. */
    return ziplistDeleteRange(zl,2*(start-1),2*count);
}

/*-----------------------------------------------------------------------------
 * Common sorted set API
 *----------------------------------------------------------------------------*/

/* Return the number of elements of the sorted set object 'zobj', whichever
 * encoding it uses. Panics on an unknown encoding. */
unsigned int zsetLength(robj *zobj) {
    int length = -1;

    switch (zobj->encoding) {
    case OBJ_ENCODING_ZIPLIST:
        length = zzlLength(zobj->ptr);
        break;
    case OBJ_ENCODING_SKIPLIST: {
        zset *zs = zobj->ptr;
        length = zs->zsl->length;
        break;
    }
    default:
        serverPanic("Unknown sorted set encoding");
    }

    return length;
}

/* Convert the sorted set object 'zobj' in place to the target 'encoding'.
 *
 * Nothing happens when the object already uses that encoding. The only
 * supported conversions are ziplist -> skiplist and skiplist -> ziplist; any
 * other source or target encoding triggers serverPanic(). After a successful
 * conversion zobj->ptr and zobj->encoding describe the new representation and
 * the old one has been released. */
void zsetConvert(robj *zobj, int encoding) {
    zset *zs;
    zskiplistNode *node, *next;
    robj *ele;
    double score;

    if (zobj->encoding == encoding) return;
    if (zobj->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *zl = zobj->ptr;
        unsigned char *eptr, *sptr;
        unsigned char *vstr;
        unsigned int vlen;
        long long vlong;

        if (encoding != OBJ_ENCODING_SKIPLIST)
            serverPanic("Unknown target encoding");

        /* Build an empty dict + skiplist pair to receive the elements. */
        zs = dalloc(sizeof(*zs));
        zs->dict = dictCreate(&zsetDictType,NULL);
        zs->zsl = zslCreate();

        /* The ziplist is asserted to hold at least one (member,score) pair. */
        eptr = ziplistIndex(zl,0);
        serverAssertWithInfo(NULL,zobj,eptr != NULL);
        sptr = ziplistNext(zl,eptr);
        serverAssertWithInfo(NULL,zobj,sptr != NULL);

        while (eptr != NULL) {
            score = zzlGetScore(sptr);
            /* NOTE(review): the ziplistGet() and dictAdd() calls below are
             * performed inside the assertion macro argument, so this loop
             * relies on serverAssertWithInfo always evaluating its
             * expression -- confirm against the macro definition. */
            serverAssertWithInfo(NULL,zobj,ziplistGet(eptr,&vstr,&vlen,&vlong));
            if (vstr == NULL)
                ele = createStringObjectFromLongLong(vlong);
            else
                ele = createStringObject((char*)vstr,vlen);

            /* Has incremented refcount since it was just created. */
            node = zslInsert(zs->zsl,score,ele);
            /* The dict value points at the score stored in the skiplist
             * node. */
            serverAssertWithInfo(NULL,zobj,dictAdd(zs->dict,ele,&node->score) == DICT_OK);
            zzlNext(zl,&eptr,&sptr);
        }

        /* Release the old ziplist and switch the object over. */
        dfree(zobj->ptr);
        zobj->ptr = zs;
        zobj->encoding = OBJ_ENCODING_SKIPLIST;
    } else if (zobj->encoding == OBJ_ENCODING_SKIPLIST) {
        unsigned char *zl = ziplistNew();

        if (encoding != OBJ_ENCODING_ZIPLIST)
            serverPanic("Unknown target encoding");

        /* Approach similar to zslFree(), since we want to free the skiplist at
         * the same time as creating the ziplist. */
        zs = zobj->ptr;
        /* Grab the first real node before the header and the list struct are
         * freed. */
        node = zs->zsl->header->level[0].forward;
        dfree(zs->zsl->header);
        dfree(zs->zsl);

        while (node) {
            /* Nodes are visited in level-0 order and appended at the tail
             * (eptr == NULL), so the ziplist keeps the skiplist order. */
            ele = getDecodedObject(node->obj);
            zl = zzlInsertAt(zl,NULL,ele,node->score);
            /* Release the decoded copy only when it is a separate object. */
            if (ele != node->obj) freeObject(ele);
            /* Read the successor before the node is freed. */
            next = node->level[0].forward;
            zslFreeNode(node);
            node = next;
        }

        dictRelease(zs->dict);
        dfree(zs);
        zobj->ptr = zl;
        zobj->encoding = OBJ_ENCODING_ZIPLIST;
    } else {
        serverPanic("Unknown sorted set encoding");
    }
}

/* Switch the sorted set object to the ziplist encoding, unless it already
 * uses it, when both the number of elements and 'maxelelen' are within the
 * configured zset_max_ziplist_entries / zset_max_ziplist_value limits. */
void zsetConvertToZiplistIfNeeded(robj *zobj, size_t maxelelen) {
    zset *zs;

    if (zobj->encoding == OBJ_ENCODING_ZIPLIST) return;

    zs = zobj->ptr;

    /* Too many elements for a ziplist. */
    if (zs->zsl->length > server.zset_max_ziplist_entries) return;

    /* Largest element too big for a ziplist. */
    if (maxelelen > server.zset_max_ziplist_value) return;

    zsetConvert(zobj,OBJ_ENCODING_ZIPLIST);
}

/* Return (by reference) the score of the specified member of the sorted set
 * storing it into *score. If the element does not exist VR_ERROR is returned
 * otherwise VR_OK is returned and *score is correctly populated.
 * If 'zobj' or 'member' is NULL, VR_ERROR is returned.
 *
 * 'score' may be NULL when the caller only wants to test for membership:
 * both encodings then skip the store. Panics on an unknown encoding. */
int zsetScore(robj *zobj, robj *member, double *score) {
    if (!zobj || !member) return VR_ERROR;

    if (zobj->encoding == OBJ_ENCODING_ZIPLIST) {
        /* zzlFind only writes through 'score' when it is not NULL. */
        if (zzlFind(zobj->ptr, member, score) == NULL) return VR_ERROR;
    } else if (zobj->encoding == OBJ_ENCODING_SKIPLIST) {
        zset *zs = zobj->ptr;
        dictEntry *de = dictFind(zs->dict, member);
        if (de == NULL) return VR_ERROR;
        /* Mirror the ziplist branch: tolerate a NULL output pointer. */
        if (score != NULL) *score = *(double*)dictGetVal(de);
    } else {
        serverPanic("Unknown sorted set encoding");
    }
    return VR_OK;
}

/*-----------------------------------------------------------------------------
 * Sorted set commands
 *----------------------------------------------------------------------------*/

/* This generic command implements both ZADD and ZINCRBY. */
#define ZADD_NONE 0
#define ZADD_INCR (1<<0)    /* Increment the score instead of setting it. */
#define ZADD_NX (1<<1)      /* Don't touch elements not already existing. */
#define ZADD_XX (1<<2)      /* Only touch elements already existing. */
#define ZADD_CH (1<<3)      /* Return num of elements added or updated. */

/* Shared implementation of ZADD and ZINCRBY.
 *
 * 'flags' is the initial ZADD_* mask supplied by the calling command; the
 * NX, XX, CH and INCR options found after the key are OR-ed into it.
 *
 * Flow:
 *  1. Parse options, then require an even number of remaining arguments
 *     (score-element pairs).
 *  2. Reject NX together with XX, and INCR with more than one pair.
 *  3. Parse all the scores before touching the data set.
 *  4. Take the write lock of the key's db, look the key up and create the
 *     sorted set when missing (unless XX was given).
 *  5. Apply every pair, updating the 'added', 'updated' and 'processed'
 *     counters.
 *  6. Reply: with INCR the resulting score, or a null bulk when nothing was
 *     processed; otherwise the number of added elements (added plus updated
 *     with CH).
 *
 * The 'cleanup' label frees the parsed scores and, when something was added
 * or updated, signals the key as modified and emits the keyspace event. */
void zaddGenericCommand(client *c, int flags) {
    static char *nanerr = "resulting score is not a number (NaN)";
    robj *key = c->argv[1];
    robj *ele;
    robj *zobj;
    robj *curobj;
    double score = 0, *scores = NULL, curscore = 0.0;
    int j, elements;
    int scoreidx = 0;
    /* The following vars are used in order to track what the command actually
     * did during the execution, to reply to the client and to trigger the
     * notification of keyspace change. */
    int added = 0;      /* Number of new elements added. */
    int updated = 0;    /* Number of elements with updated score. */
    int processed = 0;  /* Number of elements processed, may remain zero with
                           options like XX. */
    int expired = 0;    /* Filled in by lookupKeyWrite(); when set, the
                           expiredkeys statistic is bumped after unlocking. */

    /* Parse options. At the end 'scoreidx' is set to the argument position
     * of the score of the first score-element pair. */
    scoreidx = 2;
    while(scoreidx < c->argc) {
        char *opt = c->argv[scoreidx]->ptr;
        if (!strcasecmp(opt,"nx")) flags |= ZADD_NX;
        else if (!strcasecmp(opt,"xx")) flags |= ZADD_XX;
        else if (!strcasecmp(opt,"ch")) flags |= ZADD_CH;
        else if (!strcasecmp(opt,"incr")) flags |= ZADD_INCR;
        else break;
        scoreidx++;
    }

    /* Turn options into simple to check vars. */
    int incr = (flags & ZADD_INCR) != 0;
    int nx = (flags & ZADD_NX) != 0;
    int xx = (flags & ZADD_XX) != 0;
    int ch = (flags & ZADD_CH) != 0;

    /* After the options, we expect to have an even number of args, since
     * we expect any number of score-element pairs. */
    elements = c->argc-scoreidx;
    if (elements % 2) {
        addReply(c,shared.syntaxerr);
        return;
    }
    elements /= 2; /* Now this holds the number of score-element pairs. */

    /* Check for incompatible options. */
    if (nx && xx) {
        addReplyError(c,
            "XX and NX options at the same time are not compatible");
        return;
    }

    if (incr && elements > 1) {
        addReplyError(c,
            "INCR option supports a single increment-element pair");
        return;
    }

    /* Start parsing all the scores, we need to emit any syntax error
     * before executing additions to the sorted set, as the command should
     * either execute fully or nothing at all. */
    scores = dalloc(sizeof(double)*elements);
    for (j = 0; j < elements; j++) {
        /* No lock is held yet, so a parse failure can jump straight to
         * cleanup. */
        if (getDoubleFromObjectOrReply(c,c->argv[scoreidx+j*2],&scores[j],NULL)
            != VR_OK) goto cleanup;
    }
   
    fetchInternalDbByKey(c, key);
    lockDbWrite(c->db);
    /* From here on every exit path must call unlockDb(c->db). */
    /* Lookup the key and create the sorted set if does not exist. */
    zobj = lookupKeyWrite(c->db,key,&expired);
    if (zobj == NULL) {
        if (xx) {
            unlockDb(c->db);
            if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
            goto reply_to_client; /* No key + XX option: nothing to do. */
        }
        /* Pick the initial encoding from the configured ziplist limits and
         * the length of the first element. */
        if (server.zset_max_ziplist_entries == 0 ||
            server.zset_max_ziplist_value < sdslen(c->argv[scoreidx+1]->ptr))
        {
            zobj = createZsetObject();
        } else {
            zobj = createZsetZiplistObject();
        }
        dbAdd(c->db,key,zobj);
    } else {
        if (zobj->type != OBJ_ZSET) {
            unlockDb(c->db);
            if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
            addReply(c,shared.wrongtypeerr);
            goto cleanup;
        }
    }

    for (j = 0; j < elements; j++) {
        score = scores[j];

        if (zobj->encoding == OBJ_ENCODING_ZIPLIST) {
            unsigned char *eptr;

            /* Prefer non-encoded element when dealing with ziplists. */
            ele = c->argv[scoreidx+1+j*2];
            if ((eptr = zzlFind(zobj->ptr,ele,&curscore)) != NULL) {
                /* Element already present. */
                if (nx) continue;
                if (incr) {
                    score += curscore;
                    if (isnan(score)) {
                        unlockDb(c->db);
                        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
                        addReplyError(c,nanerr);
                        goto cleanup;
                    }
                }

                /* Remove and re-insert when score changed. */
                if (score != curscore) {
                    zobj->ptr = zzlDelete(zobj->ptr,eptr);
                    zobj->ptr = zzlInsert(zobj->ptr,ele,score);
                    c->vel->dirty++;
                    updated++;
                }
                processed++;
            } else if (!xx) {
                /* Optimize: check if the element is too large or the list
                 * becomes too long *before* executing zzlInsert. */
                zobj->ptr = zzlInsert(zobj->ptr,ele,score);
                /* Convert to a skiplist once either ziplist limit is
                 * exceeded; the second zsetConvert call is a no-op when the
                 * first one already converted the object. */
                if (zzlLength(zobj->ptr) > server.zset_max_ziplist_entries)
                    zsetConvert(zobj,OBJ_ENCODING_SKIPLIST);
                if (sdslen(ele->ptr) > server.zset_max_ziplist_value)
                    zsetConvert(zobj,OBJ_ENCODING_SKIPLIST);
                c->vel->dirty++;
                added++;
                processed++;
            }
        } else if (zobj->encoding == OBJ_ENCODING_SKIPLIST) {
            zset *zs = zobj->ptr;
            zskiplistNode *znode;
            dictEntry *de;

            /* The argument slot itself is replaced by the result of
             * tryObjectEncoding(). */
            ele = c->argv[scoreidx+1+j*2] =
                tryObjectEncoding(c->argv[scoreidx+1+j*2]);
            de = dictFind(zs->dict,ele);
            if (de != NULL) {
                /* Element already present. */
                if (nx) continue;
                curobj = dictGetKey(de);
                curscore = *(double*)dictGetVal(de);

                if (incr) {
                    score += curscore;
                    if (isnan(score)) {
                        unlockDb(c->db);
                        if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
                        addReplyError(c,nanerr);
                        /* Don't need to check if the sorted set is empty
                         * because we know it has at least one element. */
                        goto cleanup;
                    }
                }

                /* Remove and re-insert when score changed. We can safely
                 * delete the key object from the skiplist, since the
                 * dictionary still has a reference to it. */
                if (score != curscore) {
                    /* NOTE(review): zslDelete() runs inside the assertion
                     * macro argument; this relies on serverAssertWithInfo
                     * always evaluating its expression -- confirm. */
                    serverAssertWithInfo(c,curobj,zslDelete(zs->zsl,curscore,curobj));
                    znode = zslInsert(zs->zsl,score,curobj);
                    dictGetVal(de) = &znode->score; /* Update score ptr. */
                    c->vel->dirty++;
                    updated++;
                }
                processed++;
            } else if (!xx) {
                /* Insert a duplicate of the argument object, not the
                 * argument itself. */
                ele = dupStringObjectUnconstant(ele);
                znode = zslInsert(zs->zsl,score,ele);
                serverAssertWithInfo(c,NULL,dictAdd(zs->dict,ele,&znode->score) == DICT_OK);
                c->vel->dirty++;
                added++;
                processed++;
            }
        } else {
            serverPanic("Unknown sorted set encoding");
        }
    }

    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);

reply_to_client:
    if (incr) { /* ZINCRBY or INCR option. */
        if (processed)
            addReplyDouble(c,score);
        else
            addReply(c,shared.nullbulk);
    } else { /* ZADD. */
        addReplyLongLong(c,ch ? added+updated : added);
    }

cleanup:
    /* Reached from every exit path taken after 'scores' was allocated. The
     * db lock has already been released on all paths that took it. */
    dfree(scores);
    if (added || updated) {
        signalModifiedKey(c->db,key);
        notifyKeyspaceEvent(NOTIFY_ZSET,
            incr ? "zincr" : "zadd", key, c->db->id);
    }
}

/* ZADD entry point: runs the generic implementation with no preset flag. */
void zaddCommand(client *c) {
    zaddGenericCommand(c, ZADD_NONE);
}

/* ZINCRBY entry point: runs the generic implementation with the INCR flag
 * preset. */
void zincrbyCommand(client *c) {
    zaddGenericCommand(c, ZADD_INCR);
}

/* ZREM implementation: remove the members given in argv[2..] from the sorted
 * set stored at argv[1], under the write lock of the key's db.
 *
 * Replies with the number of members actually removed. The key itself is
 * deleted as soon as the sorted set becomes empty, in which case the
 * remaining arguments are not examined. */
void zremCommand(client *c) {
    robj *key = c->argv[1];
    robj *zobj;
    int removed = 0, keygone = 0, expired = 0;
    int j;

    fetchInternalDbByKey(c, key);
    lockDbWrite(c->db);

    /* Missing key or wrong type: the reply has already been sent. */
    zobj = lookupKeyWriteOrReply(c,key,shared.czero,&expired);
    if (zobj == NULL || checkType(c,zobj,OBJ_ZSET)) goto unlock;

    if (zobj->encoding == OBJ_ENCODING_ZIPLIST) {
        for (j = 2; j < c->argc && !keygone; j++) {
            unsigned char *eptr = zzlFind(zobj->ptr,c->argv[j],NULL);

            if (eptr == NULL) continue;

            removed++;
            zobj->ptr = zzlDelete(zobj->ptr,eptr);
            if (zzlLength(zobj->ptr) == 0) {
                dbDelete(c->db,key);
                keygone = 1;
            }
        }
    } else if (zobj->encoding == OBJ_ENCODING_SKIPLIST) {
        zset *zs = zobj->ptr;

        for (j = 2; j < c->argc && !keygone; j++) {
            dictEntry *de = dictFind(zs->dict,c->argv[j]);
            double score;

            if (de == NULL) continue;

            removed++;

            /* Delete from the skiplist first, using the score found through
             * the hash table, then from the hash table itself. */
            score = *(double*)dictGetVal(de);
            serverAssertWithInfo(c,c->argv[j],zslDelete(zs->zsl,score,c->argv[j]));
            dictDelete(zs->dict,c->argv[j]);

            if (htNeedsResize(zs->dict)) dictResize(zs->dict);
            if (dictSize(zs->dict) == 0) {
                dbDelete(c->db,key);
                keygone = 1;
            }
        }
    } else {
        serverPanic("Unknown sorted set encoding");
    }

    if (removed) {
        notifyKeyspaceEvent(NOTIFY_ZSET,"zrem",key,c->db->id);
        if (keygone)
            notifyKeyspaceEvent(NOTIFY_GENERIC,"del",key,c->db->id);
        signalModifiedKey(c->db,key);
        c->vel->dirty += removed;
    }
    addReplyLongLong(c,removed);

unlock:
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* Implements ZREMRANGEBYRANK, ZREMRANGEBYSCORE, ZREMRANGEBYLEX commands.
 *
 * 'rangetype' is one of the ZRANGE_* constants below and selects how argv[2]
 * and argv[3] are interpreted (rank indexes, score bounds or lexicographic
 * bounds). The values are also used as indexes into the event-name table in
 * step 4.
 *
 * The reply is the number of removed elements. The key is deleted when the
 * sorted set ends up empty. */
#define ZRANGE_RANK 0
#define ZRANGE_SCORE 1
#define ZRANGE_LEX 2
void zremrangeGenericCommand(client *c, int rangetype) {
    robj *key = c->argv[1];
    robj *zobj;
    int keyremoved = 0;
    unsigned long deleted = 0;
    zrangespec range;
    zlexrangespec lexrange;
    long start, end, llen;
    int expired = 0;

    /* Step 1: Parse the range. No lock is held yet, so parse errors return
     * directly. */
    if (rangetype == ZRANGE_RANK) {
        if ((getLongFromObjectOrReply(c,c->argv[2],&start,NULL) != VR_OK) ||
            (getLongFromObjectOrReply(c,c->argv[3],&end,NULL) != VR_OK))
            return;
    } else if (rangetype == ZRANGE_SCORE) {
        if (zslParseRange(c->argv[2],c->argv[3],&range) != VR_OK) {
            addReplyError(c,"min or max is not a float");
            return;
        }
    } else if (rangetype == ZRANGE_LEX) {
        if (zslParseLexRange(c->argv[2],c->argv[3],&lexrange) != VR_OK) {
            addReplyError(c,"min or max not valid string range item");
            return;
        }
    }

    fetchInternalDbByKey(c, key);
    lockDbWrite(c->db);
    /* From here on every exit goes through 'cleanup', which releases the
     * lock. */
    /* Step 2: Lookup & range sanity checks if needed. */
    if ((zobj = lookupKeyWriteOrReply(c,key,shared.czero,&expired)) == NULL ||
        checkType(c,zobj,OBJ_ZSET)) goto cleanup;

    if (rangetype == ZRANGE_RANK) {
        /* Sanitize indexes. Negative indexes count from the end. */
        llen = zsetLength(zobj);
        if (start < 0) start = llen+start;
        if (end < 0) end = llen+end;
        if (start < 0) start = 0;

        /* Invariant: start >= 0, so this test will be true when end < 0.
         * The range is empty when start > end or start >= length. */
        if (start > end || start >= llen) {
            addReply(c,shared.czero);
            goto cleanup;
        }
        if (end >= llen) end = llen-1;
    }

    /* Step 3: Perform the range deletion operation. The rank helpers take
     * 1-based ranks, hence the +1 on the 0-based indexes. */
    if (zobj->encoding == OBJ_ENCODING_ZIPLIST) {
        switch(rangetype) {
        case ZRANGE_RANK:
            zobj->ptr = zzlDeleteRangeByRank(zobj->ptr,start+1,end+1,&deleted);
            break;
        case ZRANGE_SCORE:
            zobj->ptr = zzlDeleteRangeByScore(zobj->ptr,&range,&deleted);
            break;
        case ZRANGE_LEX:
            zobj->ptr = zzlDeleteRangeByLex(zobj->ptr,&lexrange,&deleted);
            break;
        }
        if (zzlLength(zobj->ptr) == 0) {
            dbDelete(c->db,key);
            keyremoved = 1;
        }
    } else if (zobj->encoding == OBJ_ENCODING_SKIPLIST) {
        zset *zs = zobj->ptr;
        switch(rangetype) {
        case ZRANGE_RANK:
            deleted = zslDeleteRangeByRank(zs->zsl,start+1,end+1,zs->dict);
            break;
        case ZRANGE_SCORE:
            deleted = zslDeleteRangeByScore(zs->zsl,&range,zs->dict);
            break;
        case ZRANGE_LEX:
            deleted = zslDeleteRangeByLex(zs->zsl,&lexrange,zs->dict);
            break;
        }
        if (htNeedsResize(zs->dict)) dictResize(zs->dict);
        if (dictSize(zs->dict) == 0) {
            dbDelete(c->db,key);
            keyremoved = 1;
        }
    } else {
        serverPanic("Unknown sorted set encoding");
    }

    /* Step 4: Notifications and reply. */
    if (deleted) {
        /* Indexed by rangetype (ZRANGE_RANK, ZRANGE_SCORE, ZRANGE_LEX). */
        char *event[3] = {"zremrangebyrank","zremrangebyscore","zremrangebylex"};
        signalModifiedKey(c->db,key);
        notifyKeyspaceEvent(NOTIFY_ZSET,event[rangetype],key,c->db->id);
        if (keyremoved)
            notifyKeyspaceEvent(NOTIFY_GENERIC,"del",key,c->db->id);
    }
    c->vel->dirty += deleted;
    addReplyLongLong(c,deleted);

cleanup:
    /* Only reached after a successful parse, so a lex range is always
     * initialized here and must be released. */
    if (rangetype == ZRANGE_LEX) zslFreeLexRange(&lexrange);
    unlockDb(c->db);
    if (expired) update_stats_add(c->vel->stats,expiredkeys,1);
}

/* ZREMRANGEBYRANK entry point: range deletion by rank. */
void zremrangebyrankCommand(client *c) {
    zremrangeGenericCommand(c, ZRANGE_RANK);
}

/* ZREMRANGEBYSCORE entry point: range deletion by score. */
void zremrangebyscoreCommand(client *c) {
    zremrangeGenericCommand(c, ZRANGE_SCORE);
}

/* ZREMRANGEBYLEX entry point: range deletion by lexicographic range. */
void zremrangebylexCommand(client *c) {
    zremrangeGenericCommand(c, ZRANGE_LEX);
}

/* Use dirty flags for pointers that need to be cleaned up in the next
 * iteration over the zsetopval. The dirty flag for the long long value is
 * special, since long long values don't need cleanup. Instead, it means that
 * we already checked that "ell" holds a long long, or tried to convert another
 * representation into a long long value. When this was successful,
 * OPVAL_VALID_LL is set as well. */
#define OPVAL_DIRTY_ROBJ 1
#define OPVAL_DIRTY_LL 2
#define OPVAL_VALID_LL 4

typedef union _iterset iterset;
typedef union _iterzset iterzset;

/* Position the iterator embedded in 'op' on the first element of its subject.
 * Sources without a subject are left untouched. Sets (intset or hash table)
 * and sorted sets (ziplist or skiplist) are supported; anything else
 * panics. */
void zuiInitIterator(zsetopsrc *op) {
    if (op->subject == NULL) return;

    if (op->type == OBJ_SET) {
        iterset *it = &op->iter.set;

        switch (op->encoding) {
        case OBJ_ENCODING_INTSET:
            it->is.is = op->subject->ptr;
            it->is.ii = 0;
            break;
        case OBJ_ENCODING_HT:
            it->ht.dict = op->subject->ptr;
            it->ht.di = dictGetIterator(op->subject->ptr);
            /* Pre-fetch the first entry. */
            it->ht.de = dictNext(it->ht.di);
            break;
        default:
            serverPanic("Unknown set encoding");
            break;
        }
    } else if (op->type == OBJ_ZSET) {
        iterzset *it = &op->iter.zset;

        switch (op->encoding) {
        case OBJ_ENCODING_ZIPLIST:
            it->zl.zl = op->subject->ptr;
            it->zl.eptr = ziplistIndex(it->zl.zl,0);
            /* The score pointer is only set when a first member exists. */
            if (it->zl.eptr != NULL) {
                it->zl.sptr = ziplistNext(it->zl.zl,it->zl.eptr);
                ASSERT(it->zl.sptr != NULL);
            }
            break;
        case OBJ_ENCODING_SKIPLIST:
            it->sl.zs = op->subject->ptr;
            it->sl.node = it->sl.zs->zsl->header->level[0].forward;
            break;
        default:
            serverPanic("Unknown sorted set encoding");
            break;
        }
    } else {
        serverPanic("Unsupported type");
    }
}

/* Release what zuiInitIterator acquired for 'op'. Only the hash table set
 * iterator holds something to release; the other supported encodings need no
 * work. Unknown types or encodings panic. */
void zuiClearIterator(zsetopsrc *op) {
    if (op->subject == NULL) return;

    if (op->type == OBJ_SET) {
        switch (op->encoding) {
        case OBJ_ENCODING_INTSET:
            break; /* skip */
        case OBJ_ENCODING_HT:
            dictReleaseIterator(op->iter.set.ht.di);
            break;
        default:
            serverPanic("Unknown set encoding");
            break;
        }
    } else if (op->type == OBJ_ZSET) {
        switch (op->encoding) {
        case OBJ_ENCODING_ZIPLIST:
        case OBJ_ENCODING_SKIPLIST:
            break; /* skip */
        default:
            serverPanic("Unknown sorted set encoding");
            break;
        }
    } else {
        serverPanic("Unsupported type");
    }
}

/* Return the number of elements held by a ZUNIONSTORE/ZINTERSTORE source.
 *
 * A source without a subject counts as empty (0). Sets and sorted sets are
 * supported in each of their two encodings; anything else panics. */
int zuiLength(zsetopsrc *op) {
    void *payload;

    if (op->subject == NULL)
        return 0;

    payload = op->subject->ptr;

    if (op->type == OBJ_SET) {
        if (op->encoding == OBJ_ENCODING_INTSET)
            return intsetLen(payload);
        if (op->encoding == OBJ_ENCODING_HT) {
            dict *members = payload;
            return dictSize(members);
        }
        serverPanic("Unknown set encoding");
    } else if (op->type == OBJ_ZSET) {
        if (op->encoding == OBJ_ENCODING_ZIPLIST)
            return zzlLength(payload);
        if (op->encoding == OBJ_ENCODING_SKIPLIST) {
            zset *sorted = payload;
            return sorted->zsl->length;
        }
        serverPanic("Unknown sorted set encoding");
    } else {
        serverPanic("Unsupported type");
    }
}

/* Fetch the element the source iterator currently points at into `val`,
 * then advance the iterator.
 *
 * Returns 1 when an element was stored in `val`, 0 when the source has no
 * subject or the iteration is over. Elements coming from plain sets are
 * given a score of 1.0. */
int zuiNext(zsetopsrc *op, zsetopval *val) {
    int ret;

    if (op->subject == NULL)
        return 0;

    /* Drop the reference on the object left in `val` when it is flagged
     * OPVAL_DIRTY_ROBJ (zuiObjectFromValue() sets that flag on the objects
     * it creates), then start again from a blank value. */
    if (val->flags & OPVAL_DIRTY_ROBJ)
        decrRefCount(val->ele);
    memset(val,0,sizeof(*val));

    if (op->type == OBJ_SET) {
        iterset *set_it = &op->iter.set;

        if (op->encoding == OBJ_ENCODING_INTSET) {
            int64_t member;

            if (!intsetGet(set_it->is.is,set_it->is.ii,&member))
                return 0;
            val->ell = member;
            val->score = 1.0;

            /* Step to the following position. */
            set_it->is.ii++;
        } else if (op->encoding == OBJ_ENCODING_HT) {
            if (set_it->ht.de == NULL)
                return 0;
            val->ele = dictGetKey(set_it->ht.de);
            val->score = 1.0;

            /* Step to the following entry. */
            set_it->ht.de = dictNext(set_it->ht.di);
        } else {
            serverPanic("Unknown set encoding");
        }
    } else if (op->type == OBJ_ZSET) {
        iterzset *zset_it = &op->iter.zset;

        if (op->encoding == OBJ_ENCODING_ZIPLIST) {
            /* Element and score pointers are expected to be set or unset
             * together; both are tested for clarity. */
            if (zset_it->zl.eptr == NULL || zset_it->zl.sptr == NULL)
                return 0;
            ret = (int) ziplistGet(zset_it->zl.eptr,&val->estr,&val->elen,&val->ell);
            ASSERT(ret > 0);
            val->score = zzlGetScore(zset_it->zl.sptr);

            /* Step to the following element/score pair. */
            zzlNext(zset_it->zl.zl,&zset_it->zl.eptr,&zset_it->zl.sptr);
        } else if (op->encoding == OBJ_ENCODING_SKIPLIST) {
            if (zset_it->sl.node == NULL)
                return 0;
            val->ele = zset_it->sl.node->obj;
            val->score = zset_it->sl.node->score;

            /* Step to the following node on the bottom level. */
            zset_it->sl.node = zset_it->sl.node->level[0].forward;
        } else {
            serverPanic("Unknown sorted set encoding");
        }
    } else {
        serverPanic("Unsupported type");
    }

    return 1;
}

/* Make sure val->ell holds the integer form of the value, if it has one.
 *
 * The conversion is attempted only once per value: OPVAL_DIRTY_LL records
 * that it was tried and OPVAL_VALID_LL records that it succeeded. The return
 * value is non-zero when val->ell is usable. */
int zuiLongLongFromValue(zsetopval *val) {
    int parsed;

    /* Already attempted: report the cached outcome. */
    if (val->flags & OPVAL_DIRTY_LL)
        return val->flags & OPVAL_VALID_LL;

    val->flags |= OPVAL_DIRTY_LL;

    if (val->ele != NULL) {
        if (val->ele->encoding == OBJ_ENCODING_INT) {
            /* The integer is stored directly in the pointer field. */
            val->ell = (long)val->ele->ptr;
            parsed = 1;
        } else if (sdsEncodedObject(val->ele)) {
            parsed = string2ll(val->ele->ptr,sdslen(val->ele->ptr),&val->ell);
        } else {
            serverPanic("Unsupported element encoding");
            parsed = 0;
        }
    } else if (val->estr != NULL) {
        parsed = string2ll((char*)val->estr,val->elen,&val->ell);
    } else {
        /* Neither object nor buffer: val->ell was filled in directly. */
        parsed = 1;
    }

    if (parsed)
        val->flags |= OPVAL_VALID_LL;

    return val->flags & OPVAL_VALID_LL;
}

/* Return the value as an object, creating one on demand.
 *
 * When val->ele is not set yet, a string object is built from the raw buffer
 * (val->estr/val->elen) if there is one, otherwise from the integer val->ell.
 * An object created here is flagged OPVAL_DIRTY_ROBJ; zuiNext() drops the
 * reference on a value carrying that flag. */
robj *zuiObjectFromValue(zsetopval *val) {
    if (val->ele != NULL)
        return val->ele;

    if (val->estr == NULL) {
        val->ele = createStringObjectFromLongLong(val->ell);
    } else {
        val->ele = createStringObject((char*)val->estr,val->elen);
    }
    val->flags |= OPVAL_DIRTY_ROBJ;

    return val->ele;
}

/* Make sure val->estr/val->elen describe the value as a byte buffer.
 *
 * Integers (either an OBJ_ENCODING_INT object or a bare val->ell) are
 * formatted into val->_buf; sds-encoded objects are referenced in place.
 * Always returns 1. */
int zuiBufferFromValue(zsetopval *val) {
    /* Buffer form already available. */
    if (val->estr != NULL)
        return 1;

    if (val->ele == NULL) {
        val->elen = ll2string((char*)val->_buf,sizeof(val->_buf),val->ell);
        val->estr = val->_buf;
    } else if (val->ele->encoding == OBJ_ENCODING_INT) {
        val->elen = ll2string((char*)val->_buf,sizeof(val->_buf),(long)val->ele->ptr);
        val->estr = val->_buf;
    } else if (sdsEncodedObject(val->ele)) {
        val->elen = sdslen(val->ele->ptr);
        val->estr = val->ele->ptr;
    } else {
        serverPanic("Unsupported element encoding");
    }

    return 1;
}

/* Look up the element described by `val` inside the source `op`.
 *
 * Returns 1 and writes the element's score to `*score` when it is present
 * (members of plain sets always score 1.0), 0 when it is absent or when the
 * source has no subject. `val` may be converted in place to the form the
 * lookup needs (integer or object). */
int zuiFind(zsetopsrc *op, zsetopval *val, double *score) {
    if (op->subject == NULL)
        return 0;

    if (op->type == OBJ_SET) {
        if (op->encoding == OBJ_ENCODING_INTSET) {
            /* A value with no integer form cannot be in an intset. */
            if (!zuiLongLongFromValue(val))
                return 0;
            if (!intsetFind(op->subject->ptr,val->ell))
                return 0;
            *score = 1.0;
            return 1;
        } else if (op->encoding == OBJ_ENCODING_HT) {
            dict *members = op->subject->ptr;

            zuiObjectFromValue(val);
            if (dictFind(members,val->ele) == NULL)
                return 0;
            *score = 1.0;
            return 1;
        } else {
            serverPanic("Unknown set encoding");
        }
    } else if (op->type == OBJ_ZSET) {
        /* Both sorted set encodings are searched by object. */
        zuiObjectFromValue(val);

        if (op->encoding == OBJ_ENCODING_ZIPLIST) {
            /* zzlFind() receives `score` and fills it in on a match. */
            if (zzlFind(op->subject->ptr,val->ele,score) == NULL)
                return 0;
            return 1;
        } else if (op->encoding == OBJ_ENCODING_SKIPLIST) {
            zset *sorted = op->subject->ptr;
            dictEntry *entry = dictFind(sorted->dict,val->ele);

            if (entry == NULL)
                return 0;
            *score = *(double*)dictGetVal(entry);
            return 1;
        } else {
            serverPanic("Unknown sorted set encoding");
        }
    } else {
        serverPanic("Unsupported type");
    }
}

/* qsort() comparator ordering zsetopsrc entries by ascending element count.
 * The result is negative, zero or positive when s1 holds fewer, as many or
 * more elements than s2. */
int zuiCompareByCardinality(const void *s1, const void *s2) {
    int left_len = zuiLength((zsetopsrc*)s1);
    int right_len = zuiLength((zsetopsrc*)s2);

    return left_len - right_len;
}

/* Score aggregation modes understood by zunionInterAggregate(). They are
 * selected by the "sum", "min" and "max" arguments of the AGGREGATE clause
 * parsed in zunionInterGenericCommand(); REDIS_AGGR_SUM is the default. */
#define REDIS_AGGR_SUM 1
#define REDIS_AGGR_MIN 2
#define REDIS_AGGR_MAX 3
/* Score carried by dict entry _e: 1.0 when the entry has no value pointer,
 * otherwise the double that pointer refers to. Note that _e is evaluated
 * twice. */
#define zunionInterDictValue(_e) (dictGetVal(_e) == NULL ? 1.0 : *(double*)dictGetVal(_e))

/* Fold `val` into the running score `*target` according to `aggregate`
 * (REDIS_AGGR_SUM, REDIS_AGGR_MIN or REDIS_AGGR_MAX). Any other mode is a
 * programming error and panics. */
inline static void zunionInterAggregate(double *target, double val, int aggregate) {
    switch (aggregate) {
    case REDIS_AGGR_SUM: {
        double sum = *target + val;

        /* +inf plus -inf yields NaN; by convention that sum is stored
         * as 0.0 instead. */
        *target = isnan(sum) ? 0.0 : sum;
        break;
    }
    case REDIS_AGGR_MIN:
        if (val < *target)
            *target = val;
        break;
    case REDIS_AGGR_MAX:
        if (val > *target)
            *target = val;
        break;
    default:
        /* safety net */
        serverPanic("Unknown ZUNION/INTER aggregate type");
        break;
    }
}

/* Operation selector passed as the `op` argument of
 * zunionInterGenericCommand(). That function handles SET_OP_UNION and
 * SET_OP_INTER only; any other value makes it panic. */
#define SET_OP_UNION 0
#define SET_OP_DIFF 1
#define SET_OP_INTER 2

/* Shared implementation of ZUNIONSTORE and ZINTERSTORE.
 *
 * c      - the client; c->argv[2] is the number of input keys, the keys
 *          themselves start at c->argv[3] and may be followed by the
 *          optional WEIGHTS and AGGREGATE clauses.
 * dstkey - key that receives the resulting sorted set.
 * op     - SET_OP_UNION or SET_OP_INTER; any other value panics.
 *
 * Input keys may hold sets or sorted sets (set members take part with a
 * score of 1.0); missing keys behave as empty inputs. Whatever was stored at
 * dstkey is deleted first. A non-empty result is stored at dstkey and its
 * cardinality is sent as the reply; an empty result stores nothing and
 * replies 0.
 *
 * NOTE(review): unlike zrangeGenericCommand() and zcountCommand() in this
 * file, this function neither calls fetchInternalDbByKey() nor takes a DB
 * lock around its lookups -- confirm whether that is intentional. */
void zunionInterGenericCommand(client *c, robj *dstkey, int op) {
    int i, j;
    long setnum;
    int aggregate = REDIS_AGGR_SUM;
    zsetopsrc *src;
    zsetopval zval;
    robj *tmp;
    unsigned int maxelelen = 0;
    robj *dstobj;
    zset *dstzset;
    zskiplistNode *znode;
    int touched = 0;

    /* expect setnum input keys to be given */
    if ((getLongFromObjectOrReply(c, c->argv[2], &setnum, NULL) != VR_OK))
        return;

    if (setnum < 1) {
        addReplyError(c,
            "at least 1 input key is needed for ZUNIONSTORE/ZINTERSTORE");
        return;
    }

    /* test if the expected number of keys would overflow */
    if (setnum > c->argc-3) {
        addReply(c,shared.syntaxerr);
        return;
    }

    /* read keys to be used for input */
    src = dcalloc(setnum, sizeof(zsetopsrc));
    for (i = 0, j = 3; i < setnum; i++, j++) {
        robj *obj = lookupKeyWrite(c->db,c->argv[j],NULL);
        if (obj != NULL) {
            if (obj->type != OBJ_ZSET && obj->type != OBJ_SET) {
                dfree(src);
                addReply(c,shared.wrongtypeerr);
                return;
            }

            src[i].subject = obj;
            src[i].type = obj->type;
            src[i].encoding = obj->encoding;
        } else {
            /* Missing key: a NULL subject makes every zui* helper treat
             * this source as empty. */
            src[i].subject = NULL;
        }

        /* Default all weights to 1. */
        src[i].weight = 1.0;
    }

    /* parse optional extra arguments */
    if (j < c->argc) {
        int remaining = c->argc - j;

        while (remaining) {
            /* WEIGHTS must be followed by one value per input key. */
            if (remaining >= (setnum + 1) && !strcasecmp(c->argv[j]->ptr,"weights")) {
                j++; remaining--;
                for (i = 0; i < setnum; i++, j++, remaining--) {
                    if (getDoubleFromObjectOrReply(c,c->argv[j],&src[i].weight,
                            "weight value is not a float") != VR_OK)
                    {
                        dfree(src);
                        return;
                    }
                }
            } else if (remaining >= 2 && !strcasecmp(c->argv[j]->ptr,"aggregate")) {
                j++; remaining--;
                if (!strcasecmp(c->argv[j]->ptr,"sum")) {
                    aggregate = REDIS_AGGR_SUM;
                } else if (!strcasecmp(c->argv[j]->ptr,"min")) {
                    aggregate = REDIS_AGGR_MIN;
                } else if (!strcasecmp(c->argv[j]->ptr,"max")) {
                    aggregate = REDIS_AGGR_MAX;
                } else {
                    dfree(src);
                    addReply(c,shared.syntaxerr);
                    return;
                }
                j++; remaining--;
            } else {
                dfree(src);
                addReply(c,shared.syntaxerr);
                return;
            }
        }
    }

    /* sort sets from the smallest to largest, this will improve our
     * algorithm's performance */
    qsort(src,setnum,sizeof(zsetopsrc),zuiCompareByCardinality);

    dstobj = createZsetObject();
    dstzset = dstobj->ptr;
    /* zuiNext() reads zval.flags on entry, so zval has to start zeroed. */
    memset(&zval, 0, sizeof(zval));

    if (op == SET_OP_INTER) {
        /* Skip everything if the smallest input is empty. */
        if (zuiLength(&src[0]) > 0) {
            /* Precondition: as src[0] is non-empty and the inputs are ordered
             * by size, all src[i > 0] are non-empty too. */
            zuiInitIterator(&src[0]);
            while (zuiNext(&src[0],&zval)) {
                double score, value;

                score = src[0].weight * zval.score;
                if (isnan(score)) score = 0;

                for (j = 1; j < setnum; j++) {
                    /* It is not safe to access the zset we are
                     * iterating, so explicitly check for equal object. */
                    if (src[j].subject == src[0].subject) {
                        value = zval.score*src[j].weight;
                        zunionInterAggregate(&score,value,aggregate);
                    } else if (zuiFind(&src[j],&zval,&value)) {
                        value *= src[j].weight;
                        zunionInterAggregate(&score,value,aggregate);
                    } else {
                        /* Absent from one input: not part of the
                         * intersection. */
                        break;
                    }
                }

                /* Only continue when present in every input. */
                if (j == setnum) {
                    tmp = zuiObjectFromValue(&zval);
                    znode = zslInsert(dstzset->zsl,score,tmp);
                    incrRefCount(tmp); /* added to skiplist */
                    dictAdd(dstzset->dict,tmp,&znode->score);
                    incrRefCount(tmp); /* added to dictionary */

                    if (sdsEncodedObject(tmp)) {
                        if (sdslen(tmp->ptr) > maxelelen)
                            maxelelen = sdslen(tmp->ptr);
                    }
                }
            }
            zuiClearIterator(&src[0]);
        }
    } else if (op == SET_OP_UNION) {
        dict *accumulator = dictCreate(&setDictType,NULL);
        dictIterator *di;
        dictEntry *de;
        double score;

        if (setnum) {
            /* Our union is at least as large as the largest set.
             * Resize the dictionary ASAP to avoid useless rehashing. */
            dictExpand(accumulator,zuiLength(&src[setnum-1]));
        }

        /* Step 1: Create a dictionary of elements -> aggregated-scores
         * by iterating one sorted set after the other. */
        for (i = 0; i < setnum; i++) {
            if (zuiLength(&src[i]) == 0) continue;

            zuiInitIterator(&src[i]);
            while (zuiNext(&src[i],&zval)) {
                /* Initialize value */
                score = src[i].weight * zval.score;
                if (isnan(score)) score = 0;

                /* Search for this element in the accumulating dictionary. */
                de = dictFind(accumulator,zuiObjectFromValue(&zval));
                /* If we don't have it, we need to create a new entry. */
                if (de == NULL) {
                    tmp = zuiObjectFromValue(&zval);
                    /* Remember the longest single element encountered,
                     * to understand if it's possible to convert to ziplist
                     * at the end. */
                    if (sdsEncodedObject(tmp)) {
                        if (sdslen(tmp->ptr) > maxelelen)
                            maxelelen = sdslen(tmp->ptr);
                    }
                    /* Add the element with its initial score. */
                    de = dictAddRaw(accumulator,tmp);
                    incrRefCount(tmp);
                    dictSetDoubleVal(de,score);
                } else {
                    /* Update the score with the score of the new instance
                     * of the element found in the current sorted set.
                     *
                     * Here we access directly the dictEntry double
                     * value inside the union as it is a big speedup
                     * compared to using the getDouble/setDouble API. */
                    zunionInterAggregate(&de->v.d,score,aggregate);
                }
            }
            zuiClearIterator(&src[i]);
        }

        /* Step 2: convert the dictionary into the final sorted set. */
        di = dictGetIterator(accumulator);

        /* We now are aware of the final size of the resulting sorted set,
         * let's resize the dictionary embedded inside the sorted set to the
         * right size, in order to save rehashing time. */
        dictExpand(dstzset->dict,dictSize(accumulator));

        while((de = dictNext(di)) != NULL) {
            robj *ele = dictGetKey(de);
            score = dictGetDoubleVal(de);
            znode = zslInsert(dstzset->zsl,score,ele);
            incrRefCount(ele); /* added to skiplist */
            dictAdd(dstzset->dict,ele,&znode->score);
            incrRefCount(ele); /* added to dictionary */
        }
        dictReleaseIterator(di);

        /* We can free the accumulator dictionary now. */
        dictRelease(accumulator);
    } else {
        serverPanic("Unknown operator");
    }

    /* The destination is always replaced: remove any previous value before
     * deciding whether there is a new one to store. */
    if (dbDelete(c->db,dstkey)) {
        signalModifiedKey(c->db,dstkey);
        touched = 1;
        server.dirty++;
    }
    if (dstzset->zsl->length) {
        zsetConvertToZiplistIfNeeded(dstobj,maxelelen);
        dbAdd(c->db,dstkey,dstobj);
        addReplyLongLong(c,zsetLength(dstobj));
        if (!touched) signalModifiedKey(c->db,dstkey);
        notifyKeyspaceEvent(NOTIFY_ZSET,
            (op == SET_OP_UNION) ? "zunionstore" : "zinterstore",
            dstkey,c->db->id);
        server.dirty++;
    } else {
        /* Empty result: nothing is stored and the unused object is freed. */
        decrRefCount(dstobj);
        addReply(c,shared.czero);
        if (touched)
            notifyKeyspaceEvent(NOTIFY_GENERIC,"del",dstkey,c->db->id);
    }
    dfree(src);
}

/* ZUNIONSTORE entry point: c->argv[1] is the destination key, the rest of
 * the arguments are parsed by zunionInterGenericCommand(). */
void zunionstoreCommand(client *c) {
    robj *destination = c->argv[1];

    zunionInterGenericCommand(c,destination,SET_OP_UNION);
}

/* ZINTERSTORE entry point: c->argv[1] is the destination key, the rest of
 * the arguments are parsed by zunionInterGenericCommand(). */
void zinterstoreCommand(client *c) {
    robj *destination = c->argv[1];

    zunionInterGenericCommand(c,destination,SET_OP_INTER);
}

/* Shared implementation of ZRANGE and ZREVRANGE.
 *
 * c->argv[1] is the key, c->argv[2] and c->argv[3] are the start and end
 * ranks (negative values count from the end of the sorted set) and an
 * optional fifth argument "withscores" adds every element's score to the
 * reply. With a non-zero `reverse` the sorted set is walked backwards,
 * starting from its last element.
 *
 * The DB is locked with lockDbRead() from the key lookup until the reply has
 * been produced, and the keyspace hit/miss counters are updated on every
 * exit path that follows the lookup. */
void zrangeGenericCommand(client *c, int reverse) {
    robj *key = c->argv[1];
    robj *zobj;
    long start, end;
    int withscores = 0;
    int llen, rangelen;

    if (getLongFromObjectOrReply(c, c->argv[2], &start, NULL) != VR_OK)
        return;
    if (getLongFromObjectOrReply(c, c->argv[3], &end, NULL) != VR_OK)
        return;

    /* The only accepted extra argument is a single WITHSCORES. */
    if (c->argc >= 5) {
        if (c->argc > 5 || strcasecmp(c->argv[4]->ptr,"withscores") != 0) {
            addReply(c,shared.syntaxerr);
            return;
        }
        withscores = 1;
    }

    fetchInternalDbByKey(c, key);
    lockDbRead(c->db);

    zobj = lookupKeyReadOrReply(c,key,shared.emptymultibulk);
    if (zobj == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }
    if (checkType(c,zobj,OBJ_ZSET)) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        return;
    }

    /* Turn negative ranks into offsets from the end; a start that is still
     * negative afterwards is clamped to the first element. */
    llen = zsetLength(zobj);
    if (start < 0) {
        start += llen;
        if (start < 0) start = 0;
    }
    if (end < 0) end += llen;

    /* start is never negative here, so a negative end also lands in this
     * test: the range is empty when start > end or start >= length. */
    if (start > end || start >= llen) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        addReply(c,shared.emptymultibulk);
        return;
    }
    if (end >= llen) end = llen-1;
    rangelen = (end-start)+1;

    /* The element count is known up front: emit the multi-bulk header. */
    addReplyMultiBulkLen(c, withscores ? (rangelen*2) : rangelen);

    if (zobj->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *zl = zobj->ptr;
        unsigned char *eptr, *sptr;
        unsigned char *vstr;
        unsigned int vlen;
        long long vlong;

        /* Each member takes two ziplist entries (element, score), hence
         * the doubled index; negative indexes count from the tail. */
        eptr = ziplistIndex(zl, reverse ? -2-(2*start) : 2*start);

        serverAssertWithInfo(c,zobj,eptr != NULL);
        sptr = ziplistNext(zl,eptr);

        for (; rangelen > 0; rangelen--) {
            serverAssertWithInfo(c,zobj,eptr != NULL && sptr != NULL);
            serverAssertWithInfo(c,zobj,ziplistGet(eptr,&vstr,&vlen,&vlong));
            if (vstr != NULL)
                addReplyBulkCBuffer(c,vstr,vlen);
            else
                addReplyBulkLongLong(c,vlong);

            if (withscores)
                addReplyDouble(c,zzlGetScore(sptr));

            if (reverse)
                zzlPrev(zl,&eptr,&sptr);
            else
                zzlNext(zl,&eptr,&sptr);
        }
    } else if (zobj->encoding == OBJ_ENCODING_SKIPLIST) {
        zset *zs = zobj->ptr;
        zskiplist *zsl = zs->zsl;
        zskiplistNode *ln;

        /* With start == 0 the first node is directly reachable; otherwise
         * it is fetched by rank (ranks passed here are 1-based). */
        if (start > 0) {
            ln = zslGetElementByRank(zsl, reverse ? llen-start : start+1);
        } else {
            ln = reverse ? zsl->tail : zsl->header->level[0].forward;
        }

        for (; rangelen > 0; rangelen--) {
            serverAssertWithInfo(c,zobj,ln != NULL);
            addReplyBulk(c,ln->obj);
            if (withscores)
                addReplyDouble(c,ln->score);
            ln = reverse ? ln->backward : ln->level[0].forward;
        }
    } else {
        serverPanic("Unknown sorted set encoding");
    }

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* ZRANGE: forward (reverse == 0) variant of zrangeGenericCommand(). */
void zrangeCommand(client *c) {
    const int reverse = 0;

    zrangeGenericCommand(c,reverse);
}

/* ZREVRANGE: reverse (reverse == 1) variant of zrangeGenericCommand(). */
void zrevrangeCommand(client *c) {
    const int reverse = 1;

    zrangeGenericCommand(c,reverse);
}

/* This command implements ZRANGEBYSCORE, ZREVRANGEBYSCORE.
 *
 * c->argv[1] is the key and c->argv[2], c->argv[3] are the score bounds:
 * min then max for the forward command, max then min when `reverse` is
 * non-zero. The optional arguments WITHSCORES and LIMIT offset count may
 * follow. The reply is a multi-bulk list of the matching elements, each one
 * followed by its score when WITHSCORES was given.
 *
 * The DB is locked with lockDbRead() from the key lookup until the reply has
 * been produced, and the keyspace hit/miss counters are updated on every
 * exit path that follows the lookup. */
void genericZrangebyscoreCommand(client *c, int reverse) {
    zrangespec range;
    robj *key = c->argv[1];
    robj *zobj;
    long offset = 0, limit = -1;
    int withscores = 0;
    unsigned long rangelen = 0;
    void *replylen = NULL;
    int minidx, maxidx;

    /* Parse the range arguments. */
    if (reverse) {
        /* Range is given as [max,min] */
        maxidx = 2; minidx = 3;
    } else {
        /* Range is given as [min,max] */
        minidx = 2; maxidx = 3;
    }

    if (zslParseRange(c->argv[minidx],c->argv[maxidx],&range) != VR_OK) {
        addReplyError(c,"min or max is not a float");
        return;
    }

    /* Parse optional extra arguments: WITHSCORES and LIMIT offset count are
     * accepted in any order; anything else is a syntax error. (ZCOUNT is
     * served by zcountCommand() and never reaches this function.) */
    if (c->argc > 4) {
        int remaining = c->argc - 4;
        int pos = 4;

        while (remaining) {
            if (remaining >= 1 && !strcasecmp(c->argv[pos]->ptr,"withscores")) {
                pos++; remaining--;
                withscores = 1;
            } else if (remaining >= 3 && !strcasecmp(c->argv[pos]->ptr,"limit")) {
                if ((getLongFromObjectOrReply(c, c->argv[pos+1], &offset, NULL) != VR_OK) ||
                    (getLongFromObjectOrReply(c, c->argv[pos+2], &limit, NULL) != VR_OK)) return;
                pos += 3; remaining -= 3;
            } else {
                addReply(c,shared.syntaxerr);
                return;
            }
        }
    }

    fetchInternalDbByKey(c, key);
    lockDbRead(c->db);
    /* Ok, lookup the key and get the range */
    if ((zobj = lookupKeyReadOrReply(c,key,shared.emptymultibulk)) == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    } else if (checkType(c,zobj,OBJ_ZSET)) {
        /* A key of the wrong type is still counted as a keyspace hit. */
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        return;
    }

    if (zobj->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *zl = zobj->ptr;
        unsigned char *eptr, *sptr;
        unsigned char *vstr;
        unsigned int vlen;
        long long vlong;
        double score;

        /* If reversed, get the last node in range as starting point. */
        if (reverse) {
            eptr = zzlLastInRange(zl,&range);
        } else {
            eptr = zzlFirstInRange(zl,&range);
        }

        /* No "first" element in the specified interval. */
        if (eptr == NULL) {
            unlockDb(c->db);
            update_stats_add(c->vel->stats, keyspace_hits, 1);
            addReply(c, shared.emptymultibulk);
            return;
        }

        /* Get score pointer for the first element. */
        serverAssertWithInfo(c,zobj,eptr != NULL);
        sptr = ziplistNext(zl,eptr);

        /* We don't know in advance how many matching elements there are in the
         * list, so we push this object that will represent the multi-bulk
         * length in the output buffer, and will "fix" it later */
        replylen = addDeferredMultiBulkLength(c);

        /* If there is an offset, just traverse the number of elements without
         * checking the score because that is done in the next loop. */
        while (eptr && offset--) {
            if (reverse) {
                zzlPrev(zl,&eptr,&sptr);
            } else {
                zzlNext(zl,&eptr,&sptr);
            }
        }

        /* The default limit of -1 never reaches zero in the `limit--` test,
         * so without a LIMIT clause only the range check ends the loop. */
        while (eptr && limit--) {
            score = zzlGetScore(sptr);

            /* Abort when the node is no longer in range. */
            if (reverse) {
                if (!zslValueGteMin(score,&range)) break;
            } else {
                if (!zslValueLteMax(score,&range)) break;
            }

            /* We know the element exists, so ziplistGet should always succeed */
            serverAssertWithInfo(c,zobj,ziplistGet(eptr,&vstr,&vlen,&vlong));

            rangelen++;
            if (vstr == NULL) {
                addReplyBulkLongLong(c,vlong);
            } else {
                addReplyBulkCBuffer(c,vstr,vlen);
            }

            if (withscores) {
                addReplyDouble(c,score);
            }

            /* Move to next node */
            if (reverse) {
                zzlPrev(zl,&eptr,&sptr);
            } else {
                zzlNext(zl,&eptr,&sptr);
            }
        }
    } else if (zobj->encoding == OBJ_ENCODING_SKIPLIST) {
        zset *zs = zobj->ptr;
        zskiplist *zsl = zs->zsl;
        zskiplistNode *ln;

        /* If reversed, get the last node in range as starting point. */
        if (reverse) {
            ln = zslLastInRange(zsl,&range);
        } else {
            ln = zslFirstInRange(zsl,&range);
        }

        /* No "first" element in the specified interval. */
        if (ln == NULL) {
            unlockDb(c->db);
            update_stats_add(c->vel->stats, keyspace_hits, 1);
            addReply(c, shared.emptymultibulk);
            return;
        }

        /* We don't know in advance how many matching elements there are in the
         * list, so we push this object that will represent the multi-bulk
         * length in the output buffer, and will "fix" it later */
        replylen = addDeferredMultiBulkLength(c);

        /* If there is an offset, just traverse the number of elements without
         * checking the score because that is done in the next loop. */
        while (ln && offset--) {
            if (reverse) {
                ln = ln->backward;
            } else {
                ln = ln->level[0].forward;
            }
        }

        /* Same limit handling as in the ziplist branch above. */
        while (ln && limit--) {
            /* Abort when the node is no longer in range. */
            if (reverse) {
                if (!zslValueGteMin(ln->score,&range)) break;
            } else {
                if (!zslValueLteMax(ln->score,&range)) break;
            }

            rangelen++;
            addReplyBulk(c,ln->obj);

            if (withscores) {
                addReplyDouble(c,ln->score);
            }

            /* Move to next node */
            if (reverse) {
                ln = ln->backward;
            } else {
                ln = ln->level[0].forward;
            }
        }
    } else {
        serverPanic("Unknown sorted set encoding");
    }

    /* With scores every element contributes two entries to the reply. */
    if (withscores) {
        rangelen *= 2;
    }

    /* Patch the deferred multi-bulk header with the real entry count. */
    setDeferredMultiBulkLength(c, replylen, rangelen);
    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* ZRANGEBYSCORE: forward (reverse == 0) variant of
 * genericZrangebyscoreCommand(). */
void zrangebyscoreCommand(client *c) {
    const int reverse = 0;

    genericZrangebyscoreCommand(c,reverse);
}

/* ZREVRANGEBYSCORE: reverse (reverse == 1) variant of
 * genericZrangebyscoreCommand(). */
void zrevrangebyscoreCommand(client *c) {
    const int reverse = 1;

    genericZrangebyscoreCommand(c,reverse);
}

/* ZCOUNT key min max
 *
 * Replies with the number of elements of the sorted set at `key` whose score
 * falls inside the range parsed from c->argv[2] and c->argv[3].
 * shared.czero is handed to lookupKeyReadOrReply() as the reply for the
 * lookup-failure case.
 *
 * The DB is locked with lockDbRead() from the key lookup until the reply has
 * been produced, and the keyspace hit/miss counters are updated on every
 * exit path that follows the lookup. */
void zcountCommand(client *c) {
    robj *key = c->argv[1];
    robj *zobj;
    zrangespec range;
    int count = 0;

    /* Reject malformed bounds before touching the keyspace. */
    if (zslParseRange(c->argv[2],c->argv[3],&range) != VR_OK) {
        addReplyError(c,"min or max is not a float");
        return;
    }

    fetchInternalDbByKey(c, key);
    lockDbRead(c->db);

    zobj = lookupKeyReadOrReply(c, key, shared.czero);
    if (zobj == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }
    if (checkType(c, zobj, OBJ_ZSET)) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        return;
    }

    if (zobj->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *zl = zobj->ptr;
        unsigned char *eptr, *sptr;
        double score;

        /* Counting starts at the first element inside the range. */
        eptr = zzlFirstInRange(zl,&range);
        if (eptr == NULL) {
            /* Nothing in range at all. */
            unlockDb(c->db);
            update_stats_add(c->vel->stats, keyspace_hits, 1);
            addReply(c, shared.czero);
            return;
        }

        /* The starting element must not exceed the upper bound. */
        sptr = ziplistNext(zl,eptr);
        score = zzlGetScore(sptr);
        serverAssertWithInfo(c,zobj,zslValueLteMax(score,&range));

        /* Walk forward, counting until the upper bound is exceeded or the
         * list ends. eptr is known to be non-NULL on entry. */
        do {
            score = zzlGetScore(sptr);
            if (!zslValueLteMax(score,&range))
                break;
            count++;
            zzlNext(zl,&eptr,&sptr);
        } while (eptr != NULL);
    } else if (zobj->encoding == OBJ_ENCODING_SKIPLIST) {
        zset *zs = zobj->ptr;
        zskiplist *zsl = zs->zsl;
        zskiplistNode *first, *last;
        unsigned long rank;

        first = zslFirstInRange(zsl, &range);
        if (first != NULL) {
            /* Preliminary count: everything from the first in-range
             * element up to the end of the skiplist. */
            rank = zslGetRank(zsl, first->score, first->obj);
            count = (zsl->length - (rank - 1));

            /* Then remove whatever lies beyond the last in-range
             * element, when there is one. */
            last = zslLastInRange(zsl, &range);
            if (last != NULL) {
                rank = zslGetRank(zsl, last->score, last->obj);
                count -= (zsl->length - rank);
            }
        }
    } else {
        serverPanic("Unknown sorted set encoding");
    }

    addReplyLongLong(c, count);
    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* ZLEXCOUNT key min max
 *
 * Replies with the number of elements of the sorted set at `key` that fall
 * inside the lexicographical range parsed from c->argv[2] and c->argv[3].
 * The parsed range is released with zslFreeLexRange() on every path that
 * follows a successful parse.
 *
 * NOTE(review): unlike zcountCommand() in this file, this function does not
 * call fetchInternalDbByKey()/lockDbRead() before the lookup and does not
 * update the keyspace hit/miss counters -- confirm whether that is
 * intentional. */
void zlexcountCommand(client *c) {
    robj *key = c->argv[1];
    robj *zobj;
    zlexrangespec range;
    int count = 0;

    /* Reject malformed bounds before touching the keyspace. */
    if (zslParseLexRange(c->argv[2],c->argv[3],&range) != VR_OK) {
        addReplyError(c,"min or max not valid string range item");
        return;
    }

    /* Fetch the sorted set; a failed lookup or a wrong type ends here. */
    zobj = lookupKeyReadOrReply(c, key, shared.czero);
    if (zobj == NULL || checkType(c, zobj, OBJ_ZSET)) {
        zslFreeLexRange(&range);
        return;
    }

    if (zobj->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *zl = zobj->ptr;
        unsigned char *eptr, *sptr;

        /* Counting starts at the first element inside the range. */
        eptr = zzlFirstInLexRange(zl,&range);
        if (eptr == NULL) {
            /* Nothing in range at all. */
            zslFreeLexRange(&range);
            addReply(c, shared.czero);
            return;
        }

        /* The starting element must not exceed the upper bound. */
        sptr = ziplistNext(zl,eptr);
        serverAssertWithInfo(c,zobj,zzlLexValueLteMax(eptr,&range));

        /* Walk forward, counting until the upper bound is exceeded or the
         * list ends. */
        while (eptr != NULL && zzlLexValueLteMax(eptr,&range)) {
            count++;
            zzlNext(zl,&eptr,&sptr);
        }
    } else if (zobj->encoding == OBJ_ENCODING_SKIPLIST) {
        zset *zs = zobj->ptr;
        zskiplist *zsl = zs->zsl;
        zskiplistNode *first, *last;
        unsigned long rank;

        first = zslFirstInLexRange(zsl, &range);
        if (first != NULL) {
            /* Preliminary count: everything from the first in-range
             * element up to the end of the skiplist. */
            rank = zslGetRank(zsl, first->score, first->obj);
            count = (zsl->length - (rank - 1));

            /* Then remove whatever lies beyond the last in-range
             * element, when there is one. */
            last = zslLastInLexRange(zsl, &range);
            if (last != NULL) {
                rank = zslGetRank(zsl, last->score, last->obj);
                count -= (zsl->length - rank);
            }
        }
    } else {
        serverPanic("Unknown sorted set encoding");
    }

    zslFreeLexRange(&range);
    addReplyLongLong(c, count);
}

/* This command implements ZRANGEBYLEX, ZREVRANGEBYLEX.
 *
 * c->argv[1] is the key; c->argv[2] and c->argv[3] are the lexicographic
 * bounds (given as max,min when 'reverse' is non-zero, min,max otherwise).
 * Any further arguments must come as "LIMIT offset count" triples.
 *
 * The reply is a multi-bulk of the matching members. Its length is not known
 * up front, so a deferred length is pushed first and patched at the end.
 *
 * Once zslParseLexRange() has succeeded, every exit path releases the parsed
 * range with zslFreeLexRange().
 *
 * NOTE(review): unlike zcardCommand()/zscoreCommand()/zrankGenericCommand()
 * this function does not call fetchInternalDbByKey()/lockDbRead() before the
 * lookup -- confirm whether that is intentional. */
void genericZrangebylexCommand(client *c, int reverse) {
    zlexrangespec range;
    robj *key = c->argv[1];
    robj *zobj;
    long offset = 0, limit = -1;
    unsigned long rangelen = 0;
    void *replylen = NULL;
    int minidx, maxidx;

    /* Parse the range arguments. */
    if (reverse) {
        /* Range is given as [max,min] */
        maxidx = 2; minidx = 3;
    } else {
        /* Range is given as [min,max] */
        minidx = 2; maxidx = 3;
    }

    if (zslParseLexRange(c->argv[minidx],c->argv[maxidx],&range) != VR_OK) {
        addReplyError(c,"min or max not valid string range item");
        return;
    }

    /* Parse optional extra arguments: only "LIMIT offset count" triples are
     * accepted, anything else is a syntax error. */
    if (c->argc > 4) {
        int remaining = c->argc - 4;
        int pos = 4;

        while (remaining) {
            if (remaining >= 3 && !strcasecmp(c->argv[pos]->ptr,"limit")) {
                if ((getLongFromObjectOrReply(c, c->argv[pos+1], &offset, NULL) != VR_OK) ||
                    (getLongFromObjectOrReply(c, c->argv[pos+2], &limit, NULL) != VR_OK))
                {
                    /* Release the parsed range before bailing out so it is
                     * not leaked on a malformed LIMIT argument. */
                    zslFreeLexRange(&range);
                    return;
                }
                pos += 3; remaining -= 3;
            } else {
                zslFreeLexRange(&range);
                addReply(c,shared.syntaxerr);
                return;
            }
        }
    }

    /* Ok, lookup the key and get the range */
    if ((zobj = lookupKeyReadOrReply(c,key,shared.emptymultibulk)) == NULL ||
        checkType(c,zobj,OBJ_ZSET))
    {
        zslFreeLexRange(&range);
        return;
    }

    if (zobj->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *zl = zobj->ptr;
        unsigned char *eptr, *sptr;
        unsigned char *vstr;
        unsigned int vlen;
        long long vlong;

        /* If reversed, get the last node in range as starting point. */
        if (reverse) {
            eptr = zzlLastInLexRange(zl,&range);
        } else {
            eptr = zzlFirstInLexRange(zl,&range);
        }

        /* No "first" element in the specified interval. */
        if (eptr == NULL) {
            addReply(c, shared.emptymultibulk);
            zslFreeLexRange(&range);
            return;
        }

        /* Get score pointer for the first element. */
        serverAssertWithInfo(c,zobj,eptr != NULL);
        sptr = ziplistNext(zl,eptr);

        /* We don't know in advance how many matching elements there are in the
         * list, so we push this object that will represent the multi-bulk
         * length in the output buffer, and will "fix" it later */
        replylen = addDeferredMultiBulkLength(c);

        /* If there is an offset, just traverse the number of elements without
         * checking the range because that is done in the next loop. */
        while (eptr && offset--) {
            if (reverse) {
                zzlPrev(zl,&eptr,&sptr);
            } else {
                zzlNext(zl,&eptr,&sptr);
            }
        }

        /* A negative limit (the default -1) never reaches zero here, so the
         * loop is bounded only by the range and the end of the list. */
        while (eptr && limit--) {
            /* Abort when the node is no longer in range. */
            if (reverse) {
                if (!zzlLexValueGteMin(eptr,&range)) break;
            } else {
                if (!zzlLexValueLteMax(eptr,&range)) break;
            }

            /* We know the element exists, so ziplistGet should always
             * succeed. */
            serverAssertWithInfo(c,zobj,ziplistGet(eptr,&vstr,&vlen,&vlong));

            rangelen++;
            if (vstr == NULL) {
                addReplyBulkLongLong(c,vlong);
            } else {
                addReplyBulkCBuffer(c,vstr,vlen);
            }

            /* Move to next node */
            if (reverse) {
                zzlPrev(zl,&eptr,&sptr);
            } else {
                zzlNext(zl,&eptr,&sptr);
            }
        }
    } else if (zobj->encoding == OBJ_ENCODING_SKIPLIST) {
        zset *zs = zobj->ptr;
        zskiplist *zsl = zs->zsl;
        zskiplistNode *ln;

        /* If reversed, get the last node in range as starting point. */
        if (reverse) {
            ln = zslLastInLexRange(zsl,&range);
        } else {
            ln = zslFirstInLexRange(zsl,&range);
        }

        /* No "first" element in the specified interval. */
        if (ln == NULL) {
            addReply(c, shared.emptymultibulk);
            zslFreeLexRange(&range);
            return;
        }

        /* We don't know in advance how many matching elements there are in the
         * list, so we push this object that will represent the multi-bulk
         * length in the output buffer, and will "fix" it later */
        replylen = addDeferredMultiBulkLength(c);

        /* If there is an offset, just traverse the number of elements without
         * checking the range because that is done in the next loop. */
        while (ln && offset--) {
            if (reverse) {
                ln = ln->backward;
            } else {
                ln = ln->level[0].forward;
            }
        }

        while (ln && limit--) {
            /* Abort when the node is no longer in range. */
            if (reverse) {
                if (!zslLexValueGteMin(ln->obj,&range)) break;
            } else {
                if (!zslLexValueLteMax(ln->obj,&range)) break;
            }

            rangelen++;
            addReplyBulk(c,ln->obj);

            /* Move to next node */
            if (reverse) {
                ln = ln->backward;
            } else {
                ln = ln->level[0].forward;
            }
        }
    } else {
        serverPanic("Unknown sorted set encoding");
    }

    zslFreeLexRange(&range);
    setDeferredMultiBulkLength(c, replylen, rangelen);
}

/* ZRANGEBYLEX entry point: forwards to genericZrangebylexCommand() with
 * reverse = 0, i.e. bounds are read as min,max and iteration goes forward. */
void zrangebylexCommand(client *c) {
    genericZrangebylexCommand(c,0);
}

/* ZREVRANGEBYLEX entry point: forwards to genericZrangebylexCommand() with
 * reverse = 1, i.e. bounds are read as max,min and iteration goes backward. */
void zrevrangebylexCommand(client *c) {
    genericZrangebylexCommand(c,1);
}

/* ZCARD key
 *
 * Replies with zsetLength() of the sorted set stored at 'key'. A missing key
 * is answered through lookupKeyReadOrReply() with shared.czero and counted as
 * a keyspace miss; any key that exists (even of the wrong type) counts as a
 * keyspace hit. The database read lock is held for the lookup and the reply. */
void zcardCommand(client *c) {
    robj *key = c->argv[1];
    robj *zobj;

    fetchInternalDbByKey(c, key);
    lockDbRead(c->db);

    zobj = lookupKeyReadOrReply(c,key,shared.czero);
    if (zobj == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }

    /* checkType() returns non-zero on a type mismatch; in that case nothing
     * more is added to the reply here. */
    if (!checkType(c,zobj,OBJ_ZSET)) {
        addReplyLongLong(c,zsetLength(zobj));
    }

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* ZSCORE key member
 *
 * Replies with the score of c->argv[2] in the sorted set at 'key', or with
 * shared.nullbulk when the key or the member does not exist. A missing key
 * counts as a keyspace miss, every other outcome as a keyspace hit. The
 * database read lock is held for the lookup and the reply. */
void zscoreCommand(client *c) {
    robj *key = c->argv[1];
    robj *zobj;
    double score;

    fetchInternalDbByKey(c, key);
    lockDbRead(c->db);

    zobj = lookupKeyReadOrReply(c,key,shared.nullbulk);
    if (zobj == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }

    /* checkType() returns non-zero on a type mismatch; skip the score lookup
     * in that case. */
    if (!checkType(c,zobj,OBJ_ZSET)) {
        if (zsetScore(zobj,c->argv[2],&score) != VR_ERROR) {
            addReplyDouble(c,score);
        } else {
            addReply(c,shared.nullbulk);
        }
    }

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* Shared implementation of ZRANK and ZREVRANK.
 *
 * Replies with the 0-based position of member c->argv[2] inside the sorted
 * set at c->argv[1]: 'rank-1' when 'reverse' is zero, 'llen-rank' otherwise,
 * where 'rank' is the 1-based position in ascending order. Replies with
 * shared.nullbulk when the key or the member is missing.
 *
 * A missing key counts as a keyspace miss, every other outcome as a hit. The
 * database read lock is held for the lookup and the reply. */
void zrankGenericCommand(client *c, int reverse) {
    robj *key = c->argv[1];
    robj *ele = c->argv[2];
    robj *zobj;
    unsigned long llen;
    unsigned long rank;

    fetchInternalDbByKey(c, key);
    lockDbRead(c->db);

    zobj = lookupKeyReadOrReply(c,key,shared.nullbulk);
    if (zobj == NULL) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_misses, 1);
        return;
    }
    if (checkType(c,zobj,OBJ_ZSET)) {
        unlockDb(c->db);
        update_stats_add(c->vel->stats, keyspace_hits, 1);
        return;
    }

    llen = zsetLength(zobj);
    serverAssertWithInfo(c,ele,sdsEncodedObject(ele));

    if (zobj->encoding == OBJ_ENCODING_ZIPLIST) {
        unsigned char *zl = zobj->ptr;
        unsigned char *eptr = ziplistIndex(zl,0);
        unsigned char *sptr;

        serverAssertWithInfo(c,zobj,eptr != NULL);
        sptr = ziplistNext(zl,eptr);
        serverAssertWithInfo(c,zobj,sptr != NULL);

        /* Linear scan from the head: 'rank' is the 1-based position of the
         * entry currently under 'eptr'. */
        for (rank = 1; eptr != NULL; rank++) {
            if (ziplistCompare(eptr,ele->ptr,sdslen(ele->ptr)))
                break;
            zzlNext(zl,&eptr,&sptr);
        }

        if (eptr == NULL) {
            addReply(c,shared.nullbulk);
        } else {
            addReplyLongLong(c, reverse ? llen-rank : rank-1);
        }
    } else if (zobj->encoding == OBJ_ENCODING_SKIPLIST) {
        zset *zs = zobj->ptr;
        dictEntry *de = dictFind(zs->dict,ele);

        if (de == NULL) {
            addReply(c,shared.nullbulk);
        } else {
            /* The dict yields the member's score, which zslGetRank() needs
             * in order to locate the member in the skiplist. */
            double score = *(double*)dictGetVal(de);

            rank = zslGetRank(zs->zsl,score,ele);
            serverAssertWithInfo(c,ele,rank); /* Existing elements always have a rank. */
            addReplyLongLong(c, reverse ? llen-rank : rank-1);
        }
    } else {
        serverPanic("Unknown sorted set encoding");
    }

    unlockDb(c->db);
    update_stats_add(c->vel->stats, keyspace_hits, 1);
}

/* ZRANK entry point: forwards to zrankGenericCommand() with reverse = 0. */
void zrankCommand(client *c) {
    zrankGenericCommand(c, 0);
}

/* ZREVRANK entry point: forwards to zrankGenericCommand() with reverse = 1. */
void zrevrankCommand(client *c) {
    zrankGenericCommand(c, 1);
}

/* ZSCAN entry point: delegates to scanGenericCommand() with SCAN_TYPE_ZSET. */
void zscanCommand(client *c) {
    scanGenericCommand(c,SCAN_TYPE_ZSET);
}


================================================
FILE: src/vr_t_zset.h
================================================
#ifndef _VR_T_ZSET_H_
#define _VR_T_ZSET_H_

/* Struct to hold an inclusive/exclusive range spec by score comparison.
 * 'min' and 'max' are the score bounds; a non-zero 'minex' / 'maxex' marks
 * the corresponding bound as exclusive. */
typedef struct {
    double min, max;
    int minex, maxex; /* are min or max exclusive? */
} zrangespec;

/* Struct to hold an inclusive/exclusive range spec by lexicographic comparison.
 * 'min' and 'max' are string objects used as bounds; a non-zero 'minex' /
 * 'maxex' marks the corresponding bound as exclusive. A filled-in spec is
 * released with zslFreeLexRange(). */
typedef struct {
    robj *min, *max;  /* May be set to shared.(minstring|maxstring) */
    int minex, maxex; /* are min or max exclusive? */
} zlexrangespec;

/* One input source handled through the zui*() iterator functions declared
 * below (zuiInitIterator(), zuiNext(), zuiFind(), ...). It bundles the source
 * object with the iteration state for each supported representation.
 * NOTE(review): presumably 'type' and 'encoding' select which member of
 * 'iter' is active -- confirm against zuiInitIterator(). */
typedef struct {
    robj *subject;
    int type; /* Set, sorted set */
    int encoding;
    double weight;

    union {
        /* Set iterators. */
        union _iterset {
            /* Iteration state for an intset: the set plus an integer
             * cursor. */
            struct {
                intset *is;
                int ii;
            } is;
            /* Iteration state for a dict: the dict, its iterator and the
             * current entry. */
            struct {
                dict *dict;
                dictIterator *di;
                dictEntry *de;
            } ht;
        } set;

        /* Sorted set iterators. */
        union _iterzset {
            /* Iteration state for a ziplist: the list plus two entry
             * pointers (eptr/sptr, the element/score pair naming used by
             * zzlNext()/zzlPrev()). */
            struct {
                unsigned char *zl;
                unsigned char *eptr, *sptr;
            } zl;
            /* Iteration state for a skiplist-backed zset: the zset plus the
             * current node. */
            struct {
                zset *zs;
                zskiplistNode *node;
            } sl;
        } zset;
    } iter;
} zsetopsrc;

/* Store value retrieved from the iterator.
 * The element can be carried in more than one form (object, raw buffer,
 * integer); zuiLongLongFromValue(), zuiObjectFromValue() and
 * zuiBufferFromValue() convert between them.
 * NOTE(review): presumably 'flags' tracks which forms are currently valid --
 * confirm against the zui*FromValue() implementations. */
typedef struct {
    int flags;
    unsigned char _buf[32]; /* Private buffer. */
    robj *ele;              /* Element as an object. */
    unsigned char *estr;    /* Element as a byte buffer ... */
    unsigned int elen;      /* ... and the length of that buffer. */
    long long ell;          /* Element as an integer. */
    double score;           /* Score associated with the element. */
} zsetopval;

/* ---- Skiplist (zskiplist) API: creation, destruction, insert/delete ---- */
zskiplistNode *zslCreateNode(int level, double score, robj *obj);
zskiplist *zslCreate(void);
void zslFreeNode(zskiplistNode *node);
void zslFree(zskiplist *zsl);
int zslRandomLevel(void);
zskiplistNode *zslInsert(zskiplist *zsl, double score, robj *obj);
void zslDeleteNode(zskiplist *zsl, zskiplistNode *x, zskiplistNode **update);
int zslDelete(zskiplist *zsl, double score, robj *obj);
/* Skiplist helpers operating on score ranges (zrangespec). */
int zslValueLteMax(double value, zrangespec *spec);
int zslIsInRange(zskiplist *zsl, zrangespec *range);
zskiplistNode *zslFirstInRange(zskiplist *zsl, zrangespec *range);
zskiplistNode *zslLastInRange(zskiplist *zsl, zrangespec *range);
/* Skiplist range deletion; each variant also receives the companion dict. */
unsigned long zslDeleteRangeByScore(zskiplist *zsl, zrangespec *range, dict *dict);
unsigned long zslDeleteRangeByLex(zskiplist *zsl, zlexrangespec *range, dict *dict);
unsigned long zslDeleteRangeByRank(zskiplist *zsl, unsigned int start, unsigned int end, dict *dict);
/* Skiplist rank lookups. */
unsigned long zslGetRank(zskiplist *zsl, double score, robj *o);
zskiplistNode* zslGetElementByRank(zskiplist *zsl, unsigned long rank);
/* Skiplist helpers operating on lexicographic ranges (zlexrangespec). */
int zslParseLexRangeItem(robj *item, robj **dest, int *ex);
void zslFreeLexRange(zlexrangespec *spec);
int compareStringObjectsForLexRange(robj *a, robj *b);
int zslIsInLexRange(zskiplist *zsl, zlexrangespec *range);
zskiplistNode *zslFirstInLexRange(zskiplist *zsl, zlexrangespec *range);
zskiplistNode *zslLastInLexRange(zskiplist *zsl, zlexrangespec *range);
/* ---- Ziplist-encoded sorted set (zzl*) API ---- */
double zzlGetScore(unsigned char *sptr);
robj *ziplistGetObject(unsigned char *sptr);
int zzlCompareElements(unsigned char *eptr, unsigned char *cstr, unsigned int clen);
unsigned int zzlLength(unsigned char *zl);
/* Step the element/score pointer pair forward or backward. */
void zzlNext(unsigned char *zl, unsigned char **eptr, unsigned char **sptr);
void zzlPrev(unsigned char *zl, unsigned char **eptr, unsigned char **sptr);
int zzlIsInRange(unsigned char *zl, zrangespec *range);
unsigned char *zzlFirstInRange(unsigned char *zl, zrangespec *range);
unsigned char *zzlLastInRange(unsigned char *zl, zrangespec *range);
int zzlIsInLexRange(unsigned char *zl, zlexrangespec *range);
unsigned char *zzlFirstInLexRange(unsigned char *zl, zlexrangespec *range);

unsigned char *zzlLastInLexRange(unsigned char *zl, zlexrangespec *range);
/* The mutating zzl* functions below return a ziplist pointer; callers are
 * presumably expected to use the returned pointer afterwards (TODO confirm). */
unsigned char *zzlFind(unsigned char *zl, robj *ele, double *score);
unsigned char *zzlDelete(unsigned char *zl, unsigned char *eptr);
unsigned char *zzlInsertAt(unsigned char *zl, unsigned char *eptr, robj *ele, double score);
unsigned char *zzlInsert(unsigned char *zl, robj *ele, double score);
unsigned char *zzlDeleteRangeByScore(unsigned char *zl, zrangespec *range, unsigned long *deleted);
unsigned char *zzlDeleteRangeByLex(unsigned char *zl, zlexrangespec *range, unsigned long *deleted);
unsigned char *zzlDeleteRangeByRank(unsigned char *zl, unsigned int start, unsigned int end, unsigned long *deleted);
/* ---- Encoding-independent sorted set object API ---- */
unsigned int zsetLength(robj *zobj);
void zsetConvert(robj *zobj, int encoding);
void zsetConvertToZiplistIfNeeded(robj *zobj, size_t maxelelen);
int zsetScore(robj *zobj, robj *member, double *score);

/* ---- Command handlers that add, update or remove members ---- */
void zaddGenericCommand(client *c, int flags);
void zaddCommand(client *c);
void zincrbyCommand(client *c);
void zremCommand(client *c);
/* Shared implementation behind the three ZREMRANGEBY* handlers; 'rangetype'
 * selects the variant. */
void zremrangeGenericCommand(client *c, int rangetype);
void zremrangebyrankCommand(client *c);
void zremrangebyscoreCommand(client *c);
void zremrangebylexCommand(client *c) ;

/* ---- Source iterator (zsetopsrc / zsetopval) API ---- */
void zuiInitIterator(zsetopsrc *op);
void zuiClearIterator(zsetopsrc *op);
int zuiLength(zsetopsrc *op);

/* Check if the current value is valid. If so, store it in the passed structure
 * and move to the next element. If not valid, this means we have reached the
 * end of the structure and can abort. */
int zuiNext(zsetopsrc *op, zsetopval *val);
/* Conversions between the representations carried by a zsetopval. */
int zuiLongLongFromValue(zsetopval *val);
robj *zuiObjectFromValue(zsetopval *val);
int zuiBufferFromValue(zsetopval *val);

/* Find value pointed to by val in the source pointed to by op. When found,
 * return 1 and store its score in target. Return 0 otherwise. */
int zuiFind(zsetopsrc *op, zsetopval *val, double *score);
/* Comparator with a qsort()-compatible signature. */
int zuiCompareByCardinality(const void *s1, const void *s2);
/* ---- ZUNIONSTORE / ZINTERSTORE ---- */
void zunionInterGenericCommand(client *c, robj *dstkey, int op);
void zunionstoreCommand(client *c);
void zinterstoreCommand(client *c);
/* ---- ZRANGE / ZREVRANGE ---- */
void zrangeGenericCommand(client *c, int reverse);
void zrangeCommand(client *c);
void zrevrangeCommand(client *c);

/* This command implements ZRANGEBYSCORE, ZREVRANGEBYSCORE. */
void genericZrangebyscoreCommand(client *c, int reverse);
void zrangebyscoreCommand(client *c);
void zrevrangebyscoreCommand(client *c);
void zcountCommand(client *c);
void zlexcountCommand(client *c);

/* This command implements ZRANGEBYLEX, ZREVRANGEBYLEX. */
void genericZrangebylexCommand(client *c, int reverse);
void zrangebylexCommand(client *c);
void zrevrangebylexCommand(client *c);
/* ---- Single-key read commands ---- */
void zcardCommand(client *c);
void zscoreCommand(client *c);
/* Shared implementation of ZRANK / ZREVRANK; 'reverse' selects ZREVRANK. */
void zrankGenericCommand(client *c, int reverse);
void zrankCommand(client *c);
void zrevrankCommand(client *c);
void zscanCommand(client *c);

#endif


================================================
FILE: src/vr_thread.c
================================================
#include <vr_core.h>

/* Reset every field of 'thread' to its empty state.
 * Returns VR_OK on success, VR_ERROR when 'thread' is NULL. */
int
vr_thread_init(vr_thread *thread)
{
    if (thread != NULL) {
        thread->data = NULL;
        thread->fun_run = NULL;
        thread->thread_id = 0;
        thread->id = 0;
        return VR_OK;
    }

    return VR_ERROR;
}

/* Clear every field of 'thread'. A NULL 'thread' is ignored. Nothing is
 * freed here and a running thread is not stopped or joined. */
void
vr_thread_deinit(vr_thread *thread)
{
    if (thread != NULL) {
        thread->data = NULL;
        thread->fun_run = NULL;
        thread->thread_id = 0;
        thread->id = 0;
    }
}

/* Start routine handed to pthread_create() by vr_thread_start().
 *
 * 'data' is the vr_thread being started. The rand() generator is seeded
 * with the current time mixed with the thread handle, then the user
 * supplied entry point is invoked with its argument.
 *
 * The value returned by the entry point becomes the thread's exit value, so
 * pthread_join() observes it instead of an indeterminate result.
 *
 * NOTE(review): the (int) cast of pthread_self() assumes pthread_t is an
 * arithmetic type, which POSIX does not guarantee. */
static void *vr_thread_run(void *data)
{
    vr_thread *thread = data;
    srand(vr_usec_now()^(int)pthread_self());

    return thread->fun_run(thread->data);
}

/* Spawn the OS thread described by 'thread'; it runs thread->fun_run with
 * thread->data as its argument.
 *
 * Returns VR_OK once the thread has been created. Returns VR_ERROR when
 * 'thread' or its entry point is NULL, or when the attribute object or the
 * thread itself cannot be created. */
int vr_thread_start(vr_thread *thread)
{
    pthread_attr_t attr;
    int status;

    /* Validate first so no attribute object is initialised on bad input. */
    if (thread == NULL || thread->fun_run == NULL) {
        return VR_ERROR;
    }

    if (pthread_attr_init(&attr) != 0) {
        return VR_ERROR;
    }

    status = pthread_create(&thread->thread_id,
        &attr, vr_thread_run, thread);

    /* The attribute object is only needed during creation. */
    pthread_attr_destroy(&attr);

    return (status == 0) ? VR_OK : VR_ERROR;
}


================================================
FILE: src/vr_thread.h
================================================
#ifndef _VR_THREAD_H_
#define _VR_THREAD_H_

/* Signature of a thread entry point: receives the opaque 'data' pointer
 * stored in the vr_thread and returns a pointer value. */
typedef void *(*vr_thread_func_t)(void *data);

/* Descriptor for one thread. */
typedef struct vr_thread {
    int id;                   /* Numeric id; reset to 0 by init/deinit. */
    pthread_t thread_id;      /* Handle filled in by pthread_create(). */

    vr_thread_func_t fun_run; /* Entry point executed by the thread. */
    void *data;               /* Argument passed to fun_run. */
}vr_thread;

/* Reset all fields; returns VR_ERROR when 'thread' is NULL. */
int vr_thread_init(vr_thread *thread);
/* Clear all fields; a NULL 'thread' is ignored. */
void vr_thread_deinit(vr_thread *thread);
/* Create the OS thread; requires fun_run to be set. */
int vr_thread_start(vr_thread *thread);

#endif


================================================
FILE: src/vr_util.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <stdarg.h>
#include <string.h>
#include <unistd.h>
#include <fcntl.h>
#include <netdb.h>

#include <sys/time.h>
#include <sys/types.h>
#include <sys/socket.h>
#include <sys/ioctl.h>

#include <netinet/in.h>
#include <netinet/tcp.h>

#include <vr_core.h>

#ifdef VR_HAVE_BACKTRACE
# include <execinfo.h>
#endif

/* Clear O_NONBLOCK on descriptor 'sd'.
 * Returns the (negative) fcntl() result if the flags cannot be read,
 * otherwise the result of the F_SETFL call. */
int
vr_set_blocking(int sd)
{
    int current = fcntl(sd, F_GETFL, 0);

    return (current < 0) ? current : fcntl(sd, F_SETFL, current & ~O_NONBLOCK);
}

/* Set O_NONBLOCK on descriptor 'sd'.
 * Returns the (negative) fcntl() result if the flags cannot be read,
 * otherwise the result of the F_SETFL call. */
int
vr_set_nonblocking(int sd)
{
    int current = fcntl(sd, F_GETFL, 0);

    return (current < 0) ? current : fcntl(sd, F_SETFL, current | O_NONBLOCK);
}

/* Enable SO_REUSEADDR on socket 'sd'. Returns the setsockopt() result. */
int
vr_set_reuseaddr(int sd)
{
    int enable = 1;

    return setsockopt(sd, SOL_SOCKET, SO_REUSEADDR, &enable,
                      (socklen_t)sizeof(enable));
}

/*
 * Turn off the Nagle algorithm on a TCP socket.
 *
 * With TCP_NODELAY set the kernel no longer coalesces small writes to fill
 * a TCP segment, which minimizes transmit latency. Sockets using this
 * option should batch their data with readv() or writev() to avoid the
 * overhead of many small packets.
 *
 * Returns the setsockopt() result.
 */
int
vr_set_tcpnodelay(int sd)
{
    int enable = 1;

    return setsockopt(sd, IPPROTO_TCP, TCP_NODELAY, &enable,
                      (socklen_t)sizeof(enable));
}

/* Enable SO_LINGER on socket 'sd' with a linger time of 'timeout'.
 * Returns the setsockopt() result. */
int
vr_set_linger(int sd, int timeout)
{
    struct linger opt;

    opt.l_linger = timeout;
    opt.l_onoff = 1;

    return setsockopt(sd, SOL_SOCKET, SO_LINGER, &opt,
                      (socklen_t)sizeof(opt));
}

/* Set the send buffer size (SO_SNDBUF) of socket 'sd' to 'size'.
 * Returns the setsockopt() result. */
int
vr_set_sndbuf(int sd, int size)
{
    return setsockopt(sd, SOL_SOCKET, SO_SNDBUF, &size,
                      (socklen_t)sizeof(size));
}

/* Set the receive buffer size (SO_RCVBUF) of socket 'sd' to 'size'.
 * Returns the setsockopt() result. */
int
vr_set_rcvbuf(int sd, int size)
{
    return setsockopt(sd, SOL_SOCKET, SO_RCVBUF, &size,
                      (socklen_t)sizeof(size));
}

/* Fetch the pending error (SO_ERROR) of socket 'sd'.
 * When getsockopt() succeeds the pending error is stored into errno.
 * Returns the getsockopt() result. */
int
vr_get_soerror(int sd)
{
    int pending = 0;
    socklen_t optlen = sizeof(pending);
    int rc = getsockopt(sd, SOL_SOCKET, SO_ERROR, &pending, &optlen);

    if (rc == 0) {
        errno = pending;
    }

    return rc;
}

/* Return the send buffer size (SO_SNDBUF) of socket 'sd', or the negative
 * getsockopt() result on failure. */
int
vr_get_sndbuf(int sd)
{
    int bytes = 0;
    socklen_t optlen = sizeof(bytes);
    int rc = getsockopt(sd, SOL_SOCKET, SO_SNDBUF, &bytes, &optlen);

    return (rc < 0) ? rc : bytes;
}

/* Return the receive buffer size (SO_RCVBUF) of socket 'sd', or the
 * negative getsockopt() result on failure. */
int
vr_get_rcvbuf(int sd)
{
    int bytes = 0;
    socklen_t optlen = sizeof(bytes);
    int rc = getsockopt(sd, SOL_SOCKET, SO_RCVBUF, &bytes, &optlen);

    return (rc < 0) ? rc : bytes;
}

/* Enable TCP keepalive on socket 'sd'.
 *
 * SO_KEEPALIVE is always switched on. Where SOL_TCP is available, each of
 * 'keepidle', 'keepinterval' and 'keepcount' that is greater than zero is
 * applied through TCP_KEEPIDLE, TCP_KEEPINTVL and TCP_KEEPCNT respectively;
 * values <= 0 leave the corresponding setting untouched.
 *
 * Returns VR_OK on success; on the first failing setsockopt() the error is
 * logged and VR_ERROR is returned. */
int
vr_set_tcpkeepalive(int sd, int keepidle, int keepinterval, int keepcount)
{
    rstatus_t status;
    int enable = 1;

    status = setsockopt(sd, SOL_SOCKET, SO_KEEPALIVE, &enable,
                        (socklen_t)sizeof(enable));
    if (status < 0) {
        log_error("setsockopt SO_KEEPALIVE call error(%s)", strerror(errno));
        return VR_ERROR;
    }

#ifdef SOL_TCP
    if (keepidle > 0) {
        status = setsockopt(sd, SOL_TCP, TCP_KEEPIDLE, &keepidle,
                            (socklen_t)sizeof(keepidle));
        if (status < 0) {
            log_error("setsockopt TCP_KEEPIDLE call error(%s)", strerror(errno));
            return VR_ERROR;
        }
    }

    if (keepinterval > 0) {
        status = setsockopt(sd, SOL_TCP, TCP_KEEPINTVL, &keepinterval,
                            (socklen_t)sizeof(keepinterval));
        if (status < 0) {
            log_error("setsockopt TCP_KEEPINTVL call error(%s)", strerror(errno));
            return VR_ERROR;
        }
    }

    if (keepcount > 0) {
        status = setsockopt(sd, SOL_TCP, TCP_KEEPCNT, &keepcount,
                            (socklen_t)sizeof(keepcount));
        if (status < 0) {
            log_error("setsockopt TCP_KEEPCNT call error(%s)", strerror(errno));
            return VR_ERROR;
        }
    }
#endif

    return VR_OK;
}

/* Parse the first 'n' bytes of 'line' as a non-negative decimal integer.
 *
 * 'line' does not need to be NUL terminated. Returns the parsed value, or
 * -1 when 'n' is zero, when any byte is not an ASCII digit, or when the
 * value does not fit in an int.
 *
 * Overflow is detected before the multiplication is performed: signed
 * overflow is undefined behavior, so checking for a negative result
 * afterwards is not reliable. */
int
_vr_atoi(char *line, size_t n)
{
    int value = 0;

    if (n == 0) {
        return -1;
    }

    for (; n > 0; n--, line++) {
        int digit;

        if (*line < '0' || *line > '9') {
            return -1;
        }
        digit = *line - '0';

        /* value * 10 + digit <= INT_MAX  <=>  value <= (INT_MAX - digit) / 10 */
        if (value > (INT_MAX - digit) / 10) {
            return -1;
        }

        value = value * 10 + digit;
    }

    return value;
}

/* Return the number of digits of 'v' when converted to string in radix 10.
 * See ll2string() for more information.
 *
 * Values of 10^12 or more are reduced by stripping their low 12 decimal
 * digits (counted in 'carried') until the remainder falls in the range
 * covered by the comparison ladder below. */
uint32_t digits10(uint64_t v) {
    uint32_t carried = 0;

    while (v >= 1000000000000ULL) {
        v /= 1000000000000ULL;
        carried += 12;
    }

    if (v < 10) return carried + 1;
    if (v < 100) return carried + 2;
    if (v < 1000) return carried + 3;
    if (v < 10000) return carried + 4;
    if (v < 1000000) return carried + 5 + (v >= 100000);
    if (v < 100000000ULL) return carried + 7 + (v >= 10000000ULL);
    if (v < 10000000000ULL) return carried + 9 + (v >= 1000000000ULL);
    return carried + 11 + (v >= 100000000000ULL);
}

/* Like digits10() but for signed values: a negative value costs one extra
 * character for the minus sign. */
uint32_t sdigits10(int64_t v) {
    uint64_t magnitude;

    if (v >= 0) {
        return digits10(v);
    }

    /* LLONG_MIN cannot be negated without overflow, so its magnitude is
     * derived from LLONG_MAX instead. */
    if (v == LLONG_MIN) {
        magnitude = ((uint64_t) LLONG_MAX)+1;
    } else {
        magnitude = (uint64_t)-v;
    }

    return digits10(magnitude)+1; /* +1 for the minus. */
}

/* Render 'svalue' in decimal into 'dst' (capacity 'dstlen' bytes, including
 * the terminating NUL). Returns the number of characters written, not
 * counting the NUL, or 0 when the buffer is too small.
 *
 * Digits are produced two at a time from the least significant end using a
 * 00..99 lookup table. The technique follows this article (which publicizes
 * an already known approach rather than a novel one):
 *
 * https://www.facebook.com/notes/facebook-engineering/three-optimization-tips-for-c/10151361643253920
 *
 * It was adapted here to cope with signed input, since the original code
 * only handled unsigned integers. */
int
ll2string(char* dst, size_t dstlen, long long svalue) {
    static const char digits[201] =
        "0001020304050607080910111213141516171819"
        "2021222324252627282930313233343536373839"
        "4041424344454647484950515253545556575859"
        "6061626364656667686970717273747576777879"
        "8081828384858687888990919293949596979899";
    unsigned long long magnitude;
    int is_neg = (svalue < 0);
    uint32_t total;
    char *cursor;

    /* Work on the unsigned magnitude and remember the sign separately.
     * LLONG_MIN has no positive counterpart, so it is special-cased. */
    if (!is_neg) {
        magnitude = svalue;
    } else if (svalue == LLONG_MIN) {
        magnitude = ((unsigned long long) LLONG_MAX)+1;
    } else {
        magnitude = -svalue;
    }

    /* Bail out unless digits, sign and NUL all fit. */
    total = digits10(magnitude)+is_neg;
    if (total >= dstlen) return 0;

    /* Fill the buffer backwards, starting with the terminator. */
    cursor = dst + total;
    *cursor-- = '\0';

    while (magnitude >= 100) {
        unsigned int pair = (unsigned int)(magnitude % 100) * 2;

        magnitude /= 100;
        *cursor-- = digits[pair + 1];
        *cursor-- = digits[pair];
    }

    /* One or two leading digits remain. */
    if (magnitude < 10) {
        *cursor = '0' + (uint32_t) magnitude;
    } else {
        unsigned int pair = (unsigned int) magnitude * 2;

        cursor[0] = digits[pair + 1];
        cursor[-1] = digits[pair];
    }

    if (is_neg) dst[0] = '-';
    return total;
}

/* Convert a string into a long long. Returns 1 if the string could be parsed
 * into a (non-overflowing) long long, 0 otherwise.
 *
 * 's' holds 'slen' bytes and does not need to be NUL terminated. Only the
 * canonical form is accepted: an optional '-', then either a lone "0" or a
 * digit 1-9 followed by further digits. Leading zeros, "-0", a '+' sign,
 * spaces and trailing garbage are all rejected.
 *
 * On success the parsed number is stored in '*value' unless 'value' is NULL,
 * in which case the call only validates the input. */
int
string2ll(const char *s, size_t slen, long long *value) {
    const char *p = s;
    size_t plen = 0;
    int negative = 0;
    unsigned long long v;

    if (slen == 0)
        return 0;

    /* Special case: first and only digit is 0. */
    if (slen == 1 && p[0] == '0') {
        if (value != NULL) *value = 0;
        return 1;
    }

    if (p[0] == '-') {
        negative = 1;
        p++; plen++;

        /* Abort on only a negative sign. */
        if (plen == slen)
            return 0;
    }

    /* The first digit must be 1-9. The lone "0" was handled above, so a '0'
     * here would be a leading zero (or "-0"), which is not accepted. */
    if (p[0] < '1' || p[0] > '9')
        return 0;
    v = p[0]-'0';
    p++; plen++;

    while (plen < slen && p[0] >= '0' && p[0] <= '9') {
        if (v > (ULLONG_MAX / 10)) /* Overflow. */
            return 0;
        v *= 10;

        if (v > (ULLONG_MAX - (p[0]-'0'))) /* Overflow. */
            return 0;
        v += p[0]-'0';

        p++; plen++;
    }

    /* Return if not all bytes were used. */
    if (plen < slen)
        return 0;

    if (negative) {
        /* Magnitude of LLONG_MIN, which has no positive counterpart. */
        const unsigned long long min_magnitude =
            ((unsigned long long) LLONG_MAX)+1;

        if (v > min_magnitude) /* Overflow. */
            return 0;
        if (value != NULL) {
            /* Negate in the signed domain so the result does not depend on
             * an out-of-range unsigned -> signed conversion. */
            *value = (v == min_magnitude) ? LLONG_MIN : -(long long)v;
        }
    } else {
        if (v > LLONG_MAX) /* Overflow. */
            return 0;
        if (value != NULL) *value = (long long)v;
    }
    return 1;
}

/* Convert a string into a long. Returns 1 and stores the result in '*lval'
 * when the string parses (via string2ll()) to a value that fits in a long;
 * returns 0 and leaves '*lval' untouched otherwise. */
int string2l(const char *s, size_t slen, long *lval) {
    long long parsed;

    if (string2ll(s,slen,&parsed) && parsed >= LONG_MIN && parsed <= LONG_MAX) {
        *lval = (long)parsed;
        return 1;
    }

    return 0;
}

/* Convert a double to a string representation written into 'buf' (capacity
 * 'len'). Returns the number of bytes required. The representation should
 * always be parsable by strtod(3).
 *
 * NaN and the infinities are spelled "nan", "inf" and "-inf"; zero keeps its
 * sign ("0" / "-0"); integral values in a safe range take the fast integer
 * path; everything else is printed with "%.17g". */
int d2string(char *buf, size_t len, double value) {
    if (isnan(value)) {
        return snprintf(buf,len,"nan");
    }

    if (isinf(value)) {
        if (value < 0)
            return snprintf(buf,len,"-inf");
        return snprintf(buf,len,"inf");
    }

    if (value == 0) {
        /* See: http://en.wikipedia.org/wiki/Signed_zero, "Comparisons". */
        if (1.0/value < 0)
            return snprintf(buf,len,"-0");
        return snprintf(buf,len,"0");
    }

#if (DBL_MANT_DIG >= 52) && (LLONG_MAX == 0x7fffffffffffffffLL)
    {
        /* Integral doubles strictly inside this interval can be cast to
         * long long safely (assuming a 64 bit long long and a double with
         * at least 52 bits of precision). The range test comes first so the
         * cast is only evaluated when it is safe; the round trip through
         * long long then confirms there is no fractional part, and the much
         * faster integer printer is used. */
        const double lower = -4503599627370495; /* -(2^52)+1 */
        const double upper = 4503599627370496;  /* 2^52 */

        if (value > lower && value < upper &&
            value == ((double)((long long)value)))
        {
            return ll2string(buf,len,(long long)value);
        }
    }
#endif

    return snprintf(buf,len,"%.17g",value);
}

/* Tell whether 'n' is a usable port number, i.e. lies in [1, UINT16_MAX]. */
bool
vr_valid_port(int n)
{
    return n >= 1 && n <= UINT16_MAX;
}

/*
 * Send exactly n bytes on a blocking descriptor.
 *
 * send() is retried when interrupted (EINTR) and repeated after short
 * writes. Returns n once everything was sent, the negative send() result on
 * any other error, or -1 if send() reports that zero bytes were written.
 */
ssize_t
_vr_sendn(int sd, const void *vptr, size_t n)
{
    const char *cursor = vptr;
    size_t remaining = n;

    while (remaining != 0) {
        ssize_t sent = send(sd, cursor, remaining, 0);

        if (sent > 0) {
            cursor += sent;
            remaining -= (size_t)sent;
        } else if (sent == 0) {
            return -1;
        } else if (errno != EINTR) {
            return sent;
        }
        /* sent < 0 with EINTR: simply try again. */
    }

    return (ssize_t)n;
}

/*
 * Receive up to n bytes from a blocking descriptor.
 *
 * recv() is retried when interrupted (EINTR) and repeated after short
 * reads. Returns the number of bytes actually stored in vptr, which is less
 * than n only if recv() returned 0 first, or the negative recv() result on
 * any other error.
 */
ssize_t
_vr_recvn(int sd, void *vptr, size_t n)
{
    char *cursor = vptr;
    size_t remaining = n;

    while (remaining != 0) {
        ssize_t got = recv(sd, cursor, remaining, 0);

        if (got > 0) {
            cursor += got;
            remaining -= (size_t)got;
        } else if (got == 0) {
            break;
        } else if (errno != EINTR) {
            return got;
        }
        /* got < 0 with EINTR: simply try again. */
    }

    return (ssize_t)(n - remaining);
}

/*
 * Return the current time in microseconds since Epoch, or -1 (after logging
 * the error) when gettimeofday() fails.
 */
int64_t
vr_usec_now(void)
{
    struct timeval tv;

    if (gettimeofday(&tv, NULL) < 0) {
        log_error("gettimeofday failed: %s", strerror(errno));
        return -1;
    }

    return (int64_t)tv.tv_sec * 1000000LL + (int64_t)tv.tv_usec;
}

/*
 * Return the current time in milliseconds since Epoch, derived from
 * vr_usec_now() by integer division.
 */
int64_t
vr_msec_now(void)
{
    int64_t usec = vr_usec_now();

    return usec / 1000LL;
}

/*
 * Resolve an internet host name (or the wildcard address when 'name' is
 * NULL) plus 'port' into a socket address stored in 'si'.
 *
 * Returns 0 on success. Returns -1 when resolution fails, when no address
 * is returned, or when the returned address does not fit in si->addr.
 */
static int
vr_resolve_inet(sds name, int port, struct sockinfo *si)
{
    int status;
    struct addrinfo *ai = NULL; /* head of the result list */
    struct addrinfo hints;
    char *node, service[VR_UINTMAX_MAXLEN];
    int rc = -1;

    ASSERT(vr_valid_port(port));

    memset(&hints, 0, sizeof(hints));
    hints.ai_flags = AI_NUMERICSERV;
    hints.ai_family = AF_UNSPEC;     /* AF_INET or AF_INET6 */
    hints.ai_socktype = SOCK_STREAM;
    hints.ai_protocol = 0;
    hints.ai_addrlen = 0;
    hints.ai_addr = NULL;
    hints.ai_canonname = NULL;

    if (name != NULL) {
        node = (char *)name;
    } else {
        /*
         * If AI_PASSIVE flag is specified in hints.ai_flags, and node is
         * NULL, then the returned socket addresses will be suitable for
         * bind(2)ing a socket that will accept(2) connections. The returned
         * socket address will contain the wildcard IP address.
         */
        node = NULL;
        hints.ai_flags |= AI_PASSIVE;
    }

    dsnprintf(service, VR_UINTMAX_MAXLEN, "%d", port);

    /*
     * getaddrinfo() returns zero on success or one of the error codes listed
     * in gai_strerror(3) if an error occurs
     */
    status = getaddrinfo(node, service, &hints, &ai);
    if (status != 0) {
        /* 'node' is NULL for the wildcard case and must not reach %s. */
        log_error("address resolution of node '%s' service '%s' failed: %s",
                  node != NULL ? node : "(null)", service,
                  gai_strerror(status));
        return -1;
    }

    /*
     * getaddrinfo() can return a linked list of more than one addrinfo,
     * since we requested for both AF_INET and AF_INET6 addresses and the
     * host itself can be multi-homed. Since we don't care whether we are
     * using ipv4 or ipv6, we just use the first address from this collection
     * in the order in which it was returned.
     *
     * The sorting function used within getaddrinfo() is defined in RFC 3484;
     * the order can be tweaked for a particular system by editing
     * /etc/gai.conf
     */
    if (ai == NULL) {
        return -1;
    }

    /* Refuse an address that would overflow the destination storage. */
    if (ai->ai_addr != NULL && (size_t)ai->ai_addrlen <= sizeof(si->addr)) {
        si->family = ai->ai_family;
        si->addrlen = ai->ai_addrlen;
        vr_memcpy(&si->addr, ai->ai_addr, si->addrlen);
        rc = 0;
    }

    freeaddrinfo(ai);

    return rc;
}

/*
 * Build the unix domain socket address for the filesystem path held in
 * 'name' and store it in 'si'.
 *
 * Returns 0 on success, or -1 when the path plus its terminating '\0'
 * would not fit in sun_path.
 */
static int
vr_resolve_unix(sds name, struct sockinfo *si)
{
    size_t pathlen = sdslen(name);
    struct sockaddr_un *unaddr = &si->addr.un;

    /* Leave room for the '\0' appended below. */
    if (pathlen >= VR_UNIX_ADDRSTRLEN) {
        return -1;
    }

    unaddr->sun_family = AF_UNIX;
    vr_memcpy(unaddr->sun_path, name, pathlen);
    unaddr->sun_path[pathlen] = '\0';

    /* 'unaddr' points into si->addr, so the address is already in place. */
    si->family = AF_UNIX;
    si->addrlen = sizeof(*unaddr);

    return 0;
}

/*
 * Translate 'name' and 'port' into a socket address stored in 'si'.
 *
 * A non-NULL name that starts with '/' is treated as a unix domain socket
 * path; anything else, including a NULL name, is handed to the internet
 * (ipv4 / ipv6) resolver together with 'port'.
 *
 * Returns whatever the selected resolver returns.
 */
int
vr_resolve(sds name, int port, struct sockinfo *si)
{
    bool unix_path = (name != NULL) && (name[0] == '/');

    return unix_path ? vr_resolve_unix(name, si)
                     : vr_resolve_inet(name, port, si);
}

/* Describe the peer of the connected socket 'fd'.
 *
 * When 'ip' is not NULL it receives a NUL-terminated textual address of at
 * most ip_len-1 characters: the numeric address for AF_INET / AF_INET6
 * peers, or the fixed string "/unixsocket" (truncated if needed) for
 * AF_UNIX peers. When 'port' is not NULL it receives the peer port in host
 * byte order, or 0 for AF_UNIX peers.
 *
 * Returns 0 on success. On failure (getpeername() error, ip_len == 0,
 * unsupported address family, or an address that does not fit in 'ip')
 * returns -1 after storing "?" in 'ip' (or an empty string when only one
 * byte is available) and 0 in 'port'. */
static int vr_net_peer_to_string(int fd, char *ip, size_t ip_len, int *port) {
    struct sockaddr_storage sa;
    socklen_t salen = sizeof(sa);

    if (getpeername(fd,(struct sockaddr*)&sa,&salen) == -1) goto error;
    if (ip_len == 0) goto error;

    if (sa.ss_family == AF_INET) {
        struct sockaddr_in *s = (struct sockaddr_in *)&sa;
        /* inet_ntop() leaves 'ip' unspecified on failure: report an error
         * instead of returning success with garbage in the buffer. */
        if (ip && inet_ntop(AF_INET,(void*)&(s->sin_addr),ip,ip_len) == NULL)
            goto error;
        if (port) *port = ntohs(s->sin_port);
    } else if (sa.ss_family == AF_INET6) {
        struct sockaddr_in6 *s = (struct sockaddr_in6 *)&sa;
        if (ip && inet_ntop(AF_INET6,(void*)&(s->sin6_addr),ip,ip_len) == NULL)
            goto error;
        if (port) *port = ntohs(s->sin6_port);
    } else if (sa.ss_family == AF_UNIX) {
        if (ip) {
            strncpy(ip,"/unixsocket",ip_len);
            /* strncpy() does not terminate the destination when the source
             * does not fit; ip_len > 0 was checked above. */
            ip[ip_len-1] = '\0';
        }
        if (port) *port = 0;
    } else {
        goto error;
    }
    return 0;

error:
    if (ip) {
        if (ip_len >= 2) {
            ip[0] = '?';
            ip[1] = '\0';
        } else if (ip_len == 1) {
            ip[0] = '\0';
        }
    }
    if (port) *port = 0;
    return -1;
}

/* Render an ip/port pair as "ip:port" into 'buf' (at most buf_len bytes,
 * as with snprintf). An ip containing ':' is taken to be IPv6 and is
 * wrapped in square brackets: "[ip]:port".
 *
 * Returns the value returned by snprintf(). */
static int vr_net_format_addr(char *buf, size_t buf_len, char *ip, int port) {
    if (strchr(ip,':') != NULL) {
        return snprintf(buf,buf_len,"[%s]:%d",ip,port);
    }
    return snprintf(buf,buf_len,"%s:%d",ip,port);
}

/* Like vr_net_format_addr() but extract ip and port from the socket's peer.
 *
 * The status of vr_net_peer_to_string() is deliberately not checked: on
 * failure it stores "?" as the ip and 0 as the port, so the result is
 * still a printable string.
 *
 * Returns the value returned by vr_net_format_addr(). */
int vr_net_format_peer(int fd, char *buf, size_t buf_len) {
    /* VR_INET6_ADDRSTRLEN counts characters only; add one byte for the
     * terminating '\0' that inet_ntop() needs room for. */
    char ip[VR_INET6_ADDRSTRLEN + 1];
    int port;

    vr_net_peer_to_string(fd,ip,sizeof(ip),&port);
    return vr_net_format_addr(buf, buf_len, ip, port);
}

/* Fill p[0..len-1] with lowercase hexadecimal digits. No '\0' is appended.
 *
 * The preferred source is SHA1 in counter mode: a 20 byte seed is read
 * once from /dev/urandom and hashed together with a counter that is
 * incremented for every digest produced. The goal is non-colliding
 * strings, not cryptographic strength.
 *
 * If the seed cannot be read, the buffer is filled on a best-effort basis
 * from the current time, the process id and rand(). */
void
get_random_hex_chars(char *p, unsigned int len) {
    const char *hexdigits = "0123456789abcdef";
    unsigned int j;

    /* State shared by all calls. */
    static int seed_initialized = 0;
    static unsigned char seed[20]; /* The SHA1 seed, from /dev/urandom. */
    static uint64_t counter = 0; /* The counter we hash with the seed. */

    if (!seed_initialized) {
        FILE *urandom = fopen("/dev/urandom","r");

        if (urandom != NULL) {
            if (fread(seed,sizeof(seed),1,urandom) == 1) {
                seed_initialized = 1;
            }
            fclose(urandom);
        }
    }

    if (seed_initialized) {
        unsigned int remaining;

        for (remaining = len; remaining > 0; ) {
            unsigned char digest[20];
            SHA1_CTX ctx;
            unsigned int chunk = remaining;

            if (chunk > 20) chunk = 20;

            SHA1Init(&ctx);
            SHA1Update(&ctx, seed, sizeof(seed));
            SHA1Update(&ctx, (unsigned char*)&counter,sizeof(counter));
            SHA1Final(digest, &ctx);
            counter++;

            /* One hex digit per digest byte, taken from its low nibble. */
            for (j = 0; j < chunk; j++) {
                p[j] = hexdigits[digest[j] & 0x0F];
            }
            p += chunk;
            remaining -= chunk;
        }
        return;
    }

    /* No seed available: mix time, pid and rand() instead. */
    {
        char *dst = p;
        unsigned int room = len;
        struct timeval now;
        pid_t pid = getpid();
        const void *parts[3];
        size_t sizes[3];
        int k;

        gettimeofday(&now,NULL);

        parts[0] = &now.tv_usec; sizes[0] = sizeof(now.tv_usec);
        parts[1] = &now.tv_sec;  sizes[1] = sizeof(now.tv_sec);
        parts[2] = &pid;         sizes[2] = sizeof(pid);

        /* Copy each value only if it fits in what is left of the buffer. */
        for (k = 0; k < 3; k++) {
            if (room >= sizes[k]) {
                memcpy(dst,parts[k],sizes[k]);
                room -= sizes[k];
                dst += sizes[k];
            }
        }

        /* Xor with rand() output and reduce every byte to a hex digit. */
        for (j = 0; j < len; j++) {
            p[j] ^= rand();
            p[j] = hexdigits[p[j] & 0x0F];
        }
    }
}

/* Glob-style pattern matching.
 *
 * Matches the first 'stringLen' bytes of 'string' against the first
 * 'patternLen' bytes of 'pattern'. Neither buffer needs to be
 * NUL-terminated: no byte at or beyond the given lengths is examined.
 *
 * Supported syntax:
 *   *        any sequence of bytes, including the empty one
 *   ?        exactly one byte
 *   [abc]    one byte out of a set; "a-z" ranges, a leading '^' to negate
 *            the set and '\' to escape a byte inside it are understood
 *   \x       the byte x taken literally
 *
 * When 'nocase' is non zero, literal bytes and ranges are compared after
 * tolower().
 *
 * Returns 1 if the whole string matches the whole pattern, 0 otherwise. */
int stringmatchlen(const char *pattern, int patternLen,
        const char *string, int stringLen, int nocase)
{
    while(patternLen) {
        switch(pattern[0]) {
        case '*':
            /* Collapse a run of '*' without looking past the pattern. */
            while (patternLen > 1 && pattern[1] == '*') {
                pattern++;
                patternLen--;
            }
            if (patternLen == 1)
                return 1; /* match */
            /* Try the rest of the pattern at every remaining position. */
            while(stringLen) {
                if (stringmatchlen(pattern+1, patternLen-1,
                            string, stringLen, nocase))
                    return 1; /* match */
                string++;
                stringLen--;
            }
            return 0; /* no match */
        case '?':
            if (stringLen == 0)
                return 0; /* no match */
            string++;
            stringLen--;
            break;
        case '[':
        {
            int not, match;

            /* A class always consumes one byte of the string. */
            if (stringLen == 0)
                return 0; /* no match */

            pattern++;
            patternLen--;
            not = patternLen > 0 && pattern[0] == '^';
            if (not) {
                pattern++;
                patternLen--;
            }
            match = 0;
            while(1) {
                if (patternLen == 0) {
                    /* Unterminated class: step back so that the common
                     * advance after the switch lands on the pattern end. */
                    pattern--;
                    patternLen++;
                    break;
                } else if (pattern[0] == '\\' && patternLen >= 2) {
                    pattern++;
                    patternLen--;
                    if (pattern[0] == string[0])
                        match = 1;
                } else if (pattern[0] == ']') {
                    break;
                } else if (patternLen >= 3 && pattern[1] == '-') {
                    int start = pattern[0];
                    int end = pattern[2];
                    int c = string[0];
                    if (start > end) {
                        int t = start;
                        start = end;
                        end = t;
                    }
                    if (nocase) {
                        start = tolower(start);
                        end = tolower(end);
                        c = tolower(c);
                    }
                    pattern += 2;
                    patternLen -= 2;
                    if (c >= start && c <= end)
                        match = 1;
                } else {
                    if (!nocase) {
                        if (pattern[0] == string[0])
                            match = 1;
                    } else {
                        if (tolower((int)pattern[0]) == tolower((int)string[0]))
                            match = 1;
                    }
                }
                pattern++;
                patternLen--;
            }
            if (not)
                match = !match;
            if (!match)
                return 0; /* no match */
            string++;
            stringLen--;
            break;
        }
        case '\\':
            if (patternLen >= 2) {
                pattern++;
                patternLen--;
            }
            /* fall through */
        default:
            /* A literal needs a byte of the string to compare against. */
            if (stringLen == 0)
                return 0; /* no match */
            if (!nocase) {
                if (pattern[0] != string[0])
                    return 0; /* no match */
            } else {
                if (tolower((int)pattern[0]) != tolower((int)string[0]))
                    return 0; /* no match */
            }
            string++;
            stringLen--;
            break;
        }
        pattern++;
        patternLen--;
        if (stringLen == 0) {
            /* The string is exhausted: only trailing '*' may remain. */
            while(patternLen > 0 && *pattern == '*') {
                pattern++;
                patternLen--;
            }
            break;
        }
    }
    if (patternLen == 0 && stringLen == 0)
        return 1;
    return 0;
}

/* Glob-style match of two NUL-terminated strings: measures both with
 * strlen() and defers to stringmatchlen(). */
int stringmatch(const char *pattern, const char *string, int nocase) {
    int plen = strlen(pattern);
    int slen = strlen(string);

    return stringmatchlen(pattern,plen,string,slen,nocase);
}

/* Reverse, in place, the byte order of the 2 bytes pointed to by p
 * (little endian <-> big endian for a 16 bit integer). */
void memrev16(void *p) {
    unsigned char *bytes = p;
    unsigned char first = bytes[0];

    bytes[0] = bytes[1];
    bytes[1] = first;
}

/* Reverse, in place, the byte order of the 4 bytes pointed to by p
 * (little endian <-> big endian for a 32 bit integer). */
void memrev32(void *p) {
    unsigned char *bytes = p;
    int lo, hi;

    /* Swap the outer pair, then the inner pair. */
    for (lo = 0, hi = 3; lo < hi; lo++, hi--) {
        unsigned char keep = bytes[lo];
        bytes[lo] = bytes[hi];
        bytes[hi] = keep;
    }
}

/* Reverse, in place, the byte order of the 8 bytes pointed to by p
 * (little endian <-> big endian for a 64 bit integer). */
void memrev64(void *p) {
    unsigned char *bytes = p;
    int lo, hi;

    /* Swap mirrored bytes, working from the ends towards the middle. */
    for (lo = 0, hi = 7; lo < hi; lo++, hi--) {
        unsigned char keep = bytes[lo];
        bytes[lo] = bytes[hi];
        bytes[hi] = keep;
    }
}

/* Return v with its two bytes swapped. */
uint16_t intrev16(uint16_t v) {
    uint16_t swapped = v;

    memrev16(&swapped);
    return swapped;
}

/* Return v with the order of its four bytes reversed. */
uint32_t intrev32(uint32_t v) {
    uint32_t swapped = v;

    memrev32(&swapped);
    return swapped;
}

/* Return v with the order of its eight bytes reversed. */
uint64_t intrev64(uint64_t v) {
    uint64_t swapped = v;

    memrev64(&swapped);
    return swapped;
}

/* Convert a string representing an amount of memory into the number of
 * bytes, so for instance memtoll("1Gb") will return 1073741824 that is
 * (1024*1024*1024).
 *
 * The accepted form is an optional '-', decimal digits, and an optional
 * case-insensitive unit: "b" (1), "k" (1000), "kb" (1024), "m" (1000^2),
 * "mb" (1024^2), "g" (1000^3) or "gb" (1024^3).
 *
 * If 'err' is not NULL, *err is set to 1 on parsing error and to 0
 * otherwise. A result that does not fit in a long long is reported as a
 * parsing error. On error the function returns 0, whether or not 'err'
 * is NULL.
 *
 * Note: an input without digits (e.g. "" or "kb") yields 0 without
 * raising an error. */
long long memtoll(const char *p, int *err) {
    const char *u;
    char buf[128];
    long mul; /* unit multiplier */
    long long val;
    /* Largest long long, derived without relying on <limits.h>. */
    const long long llmax = (long long)(~0ULL >> 1);
    const long long llmin = -llmax - 1;
    unsigned int digits;
    char *endptr;

    if (err) *err = 0;

    /* Search the first non digit character. */
    u = p;
    if (*u == '-') u++;
    /* <ctype.h> functions require a value representable as unsigned char. */
    while(*u && isdigit((unsigned char)*u)) u++;
    if (*u == '\0' || !strcasecmp(u,"b")) {
        mul = 1;
    } else if (!strcasecmp(u,"k")) {
        mul = 1000;
    } else if (!strcasecmp(u,"kb")) {
        mul = 1024;
    } else if (!strcasecmp(u,"m")) {
        mul = 1000*1000;
    } else if (!strcasecmp(u,"mb")) {
        mul = 1024*1024;
    } else if (!strcasecmp(u,"g")) {
        mul = 1000L*1000*1000;
    } else if (!strcasecmp(u,"gb")) {
        mul = 1024L*1024*1024;
    } else {
        if (err) *err = 1;
        return 0;
    }

    /* Copy the digits into a buffer, we'll use strtoll() to convert
     * the digit (without the unit) into a number. */
    digits = u-p;
    if (digits >= sizeof(buf)) {
        if (err) *err = 1;
        return 0;
    }
    memcpy(buf,p,digits);
    buf[digits] = '\0';

    errno = 0;
    val = strtoll(buf,&endptr,10);
    if ((val == 0 && errno == EINVAL) || errno == ERANGE || *endptr != '\0') {
        if (err) *err = 1;
        return 0;
    }

    /* mul is always >= 1 here: reject products that would overflow. */
    if (val > llmax/mul || val < llmin/mul) {
        if (err) *err = 1;
        return 0;
    }
    return val*mul;
}

/* Write a human readable rendition of the byte count 'n' into 's':
 * "<n>B" below 1024, otherwise the value divided by the largest fitting
 * power of 1024 with two decimals and a K, M, G, T or P suffix. Values of
 * 1024^6 and above are printed as plain bytes again.
 *
 * 's' must be large enough for the result; no bound is checked. */
void bytesToHuman(char *s, unsigned long long n) {
    const unsigned long long kib = 1024ULL;
    const unsigned long long mib = kib * 1024;
    const unsigned long long gib = mib * 1024;
    const unsigned long long tib = gib * 1024;
    const unsigned long long pib = tib * 1024;
    const unsigned long long eib = pib * 1024;

    if (n < kib) {
        /* Bytes */
        sprintf(s,"%lluB",n);
        return;
    }
    if (n < mib) {
        sprintf(s,"%.2fK",(double)n/(double)kib);
        return;
    }
    if (n < gib) {
        sprintf(s,"%.2fM",(double)n/(double)mib);
        return;
    }
    if (n < tib) {
        sprintf(s,"%.2fG",(double)n/(double)gib);
        return;
    }
    if (n < pib) {
        sprintf(s,"%.2fT",(double)n/(double)tib);
        return;
    }
    if (n < eib) {
        sprintf(s,"%.2fP",(double)n/(double)pib);
        return;
    }
    /* Let's hope we never need this */
    sprintf(s,"%lluB",n);
}

/* Return the absolute path of 'filename' as a new SDS string, or NULL if
 * the current working directory cannot be obtained.
 *
 * Leading and trailing blanks (space, \r, \n, \t) are stripped first. A
 * name that then starts with '/' is returned as is. Otherwise the name is
 * appended to the current working directory.
 *
 * No general normalization is attempted: only "../" elements appearing at
 * the very start of the relative path are resolved, each one removing the
 * last element of the working directory. */
sds getAbsolutePath(char *filename) {
    char cwd[1024];
    sds base;
    sds rel = sdstrim(sdsnew(filename)," \r\n\t");

    if (rel[0] == '/') return rel; /* Path is already absolute. */

    /* Relative path: it has to be joined with the working directory. */
    if (getcwd(cwd,sizeof(cwd)) == NULL) {
        sdsfree(rel);
        return NULL;
    }
    base = sdsnew(cwd);
    if (sdslen(base) && base[sdslen(base)-1] != '/')
        base = sdscat(base,"/");

    /* 'base' now ends with "/". For every "../" at the start of 'rel',
     * drop it and also drop the last element of 'base', unless 'base' is
     * just "/". */
    for (;;) {
        if (sdslen(rel) < 3) break;
        if (rel[0] != '.' || rel[1] != '.' || rel[2] != '/') break;

        sdsrange(rel,3,-1);
        if (sdslen(base) > 1) {
            /* Start on the char before the trailing '/' and walk back to
             * the previous '/', counting the bytes to cut off. */
            char *slash = base + sdslen(base)-2;
            int drop = 1;

            for (; *slash != '/'; slash--) drop++;
            sdsrange(base,0,-(drop+1));
        }
    }

    /* Finally glue the two parts together. */
    base = sdscatsds(base,rel);
    sdsfree(rel);
    return base;
}


================================================
FILE: src/vr_util.h
================================================
#ifndef _VR_UTIL_H_
#define _VR_UTIL_H_

#include <stdarg.h>
#include <stdint.h>
#include <stdbool.h>

#include <netinet/in.h>
#include <sys/un.h>

/* Double expansion needed for stringification of macro values:
 * __xstr(X) expands X first and then turns the result into a string,
 * while __str(X) stringifies X as written. */
#define __xstr(s) __str(s)
#define __str(s) #s

/*
 * Lengths of textual socket addresses.
 *
 * The INET4 / INET6 values count characters only: the "- 1" drops the
 * terminating '\0' from sizeof, so a buffer meant to hold such a string
 * needs one extra byte.
 *
 * VR_INET_ADDRSTRLEN relies on a MAX() macro that is not defined in this
 * header -- presumably provided by another project header; verify the
 * include order.
 *
 * VR_UNIX_ADDRSTRLEN is the number of bytes from the start of sun_path
 * to the end of struct sockaddr_un.
 */
#define VR_INET4_ADDRSTRLEN (sizeof("255.255.255.255") - 1)
#define VR_INET6_ADDRSTRLEN \
    (sizeof("ffff:ffff:ffff:ffff:ffff:ffff:255.255.255.255") - 1)
#define VR_INET_ADDRSTRLEN  MAX(VR_INET4_ADDRSTRLEN, VR_INET6_ADDRSTRLEN)
#define VR_UNIX_ADDRSTRLEN  \
    (sizeof(struct sockaddr_un) - offsetof(struct sockaddr_un, sun_path))
    
#define VR_INET_PEER_ID_LEN (VR_INET_ADDRSTRLEN+32) /* Must be enough for ip:port */

#define VR_MAXHOSTNAMELEN   256

/*
 * Length of 1 byte, 2 bytes, 4 bytes, 8 bytes and largest integral
 * type (uintmax_t) in ascii, including the null terminator '\0'
 *
 * From stdint.h, we have:
 * # define UINT8_MAX   (255)
 * # define UINT16_MAX  (65535)
 * # define UINT32_MAX  (4294967295U)
 * # define UINT64_MAX  (__UINT64_C(18446744073709551615))
 *
 * Each value below is the digit count of the matching maximum plus one
 * byte for the terminator.
 */
#define VR_UINT8_MAXLEN     (3 + 1)
#define VR_UINT16_MAXLEN    (5 + 1)
#define VR_UINT32_MAXLEN    (10 + 1)
#define VR_UINT64_MAXLEN    (20 + 1)
#define VR_UINTMAX_MAXLEN   VR_UINT64_MAXLEN

#define LONG_STR_SIZE       21  /* Bytes needed for long -> str */

/*
 * Round data 'd' or pointer 'p' up to the next multiple of 'n', where
 * 'n' is a power of 2.
 *
 * Every macro argument is parenthesized so that expressions such as
 * "1 << 3" can be passed as 'n'. Note that 'n' is evaluated twice.
 */
#define VR_ALIGNMENT        sizeof(unsigned long) /* platform word */
#define VR_ALIGN(d, n)      (((d) + ((n) - 1)) & ~((n) - 1))
#define VR_ALIGN_PTR(p, n)  \
    (void *) (((uintptr_t) (p) + ((uintptr_t) (n) - 1)) & ~((uintptr_t) (n) - 1))

/*
 * Wrapper to workaround well known, safe, implicit type conversion when
 * invoking system calls.
 *
 * The arguments are parenthesized before being cast, so that a compound
 * expression (e.g. "buf + 1") is evaluated as written and only its result
 * is converted.
 */
#define vr_gethostname(_name, _len) \
    gethostname((char *)(_name), (size_t)(_len))

#define vr_atoi(_line, _n)          \
    _vr_atoi((char *)(_line), (size_t)(_n))

int vr_set_blocking(int sd);
int vr_set_nonblocking(int sd);
int vr_set_reuseaddr(int sd);
int vr_set_tcpnodelay(int sd);
int vr_set_linger(int sd, int timeout);
int vr_set_sndbuf(int sd, int size);
int vr_set_rcvbuf(int sd, int size);
int vr_get_soerror(int sd);
int vr_get_sndbuf(int sd);
int vr_get_rcvbuf(int sd);
int vr_set_tcpkeepalive(int sd, int keepidle, int keepinterval, int keepcount);

int _vr_atoi(char *line, size_t n);
uint32_t digits10(uint64_t v);
uint32_t sdigits10(int64_t v);
int ll2string(char* dst, size_t dstlen, long long svalue);
int string2ll(const char *s, size_t slen, long long *value);
int string2l(const char *s, size_t slen, long *lval);
int d2string(char *buf, size_t len, double value);

bool vr_valid_port(int n);

/*
 * Wrappers to send or receive n byte message on a blocking
 * socket descriptor.
 *
 * They forward to _vr_sendn() / _vr_recvn(), converting the length
 * argument to size_t.
 */
#define vr_sendn(_s, _b, _n)    \
    _vr_sendn(_s, _b, (size_t)(_n))

#define vr_recvn(_s, _b, _n)    \
    _vr_recvn(_s, _b, (size_t)(_n))

/*
 * Wrappers to read or write data to/from (multiple) buffers
 * to a file or socket descriptor.
 *
 * They expand to read(), readv(), write() and writev() with the count
 * argument converted to the type the call takes: size_t for the single
 * buffer calls, int for the vectored ones.
 */
#define vr_read(_d, _b, _n)     \
    read(_d, _b, (size_t)(_n))

#define vr_readv(_d, _b, _n)    \
    readv(_d, _b, (int)(_n))

#define vr_write(_d, _b, _n)    \
    write(_d, _b, (size_t)(_n))

#define vr_writev(_d, _b, _n)   \
    writev(_d, _b, (int)(_n))

ssize_t _vr_sendn(int sd, const void *vptr, size_t n);
ssize_t _vr_recvn(int sd, void *vptr, size_t n);

int64_t vr_usec_now(void);
int64_t vr_msec_now(void);

/*
 * Address resolution for internet (ipv4 and ipv6) and unix domain
 * socket address.
 */

/*
 * A resolved socket address, as filled in by vr_resolve().
 *
 * 'family' tells which member of 'addr' is meaningful and 'addrlen' is
 * the length in bytes of the address stored there.
 */
struct sockinfo {
    int       family;              /* socket address family */
    socklen_t addrlen;             /* socket address length */
    union {
        struct sockaddr_in  in;    /* ipv4 socket address */
        struct sockaddr_in6 in6;   /* ipv6 socket address */
        struct sockaddr_un  un;    /* unix domain address */
    } addr;
};

int vr_resolve(sds name, int port, struct sockinfo *si);
int vr_net_format_peer(int fd, char *buf, size_t buf_len);

void get_random_hex_chars(char *p, unsigned int len);

int stringmatchlen(const char *pattern, int patternLen, const char *string, int stringLen, int nocase);
int stringmatch(const char *pattern, const char *string, int nocase);

/*
 * Wrapper around common routines for manipulating C character
 * strings
 *
 * The wrappers add the casts needed to use the libc routines with
 * uint8_t buffers and integer lengths. Each one expands to a single
 * expression without a trailing ';', so it can be used anywhere an
 * expression is allowed.
 *
 * vr_strchr() searches forward in [_p, _l) and vr_strrchr() searches
 * backward from _p down to _s; both return NULL when _c is not found.
 */
#define vr_memcpy(_d, _c, _n)           \
    memcpy(_d, _c, (size_t)(_n))

#define vr_memmove(_d, _c, _n)          \
    memmove(_d, _c, (size_t)(_n))

#define vr_memchr(_d, _c, _n)           \
    memchr(_d, _c, (size_t)(_n))

#define vr_strlen(_s)                   \
    strlen((char *)(_s))

#define vr_strncmp(_s1, _s2, _n)        \
    strncmp((char *)(_s1), (char *)(_s2), (size_t)(_n))

#define vr_strchr(_p, _l, _c)           \
    _vr_strchr((uint8_t *)(_p), (uint8_t *)(_l), (uint8_t)(_c))

#define vr_strrchr(_p, _s, _c)          \
    _vr_strrchr((uint8_t *)(_p),(uint8_t *)(_s), (uint8_t)(_c))

#define vr_strndup(_s, _n)              \
    (uint8_t *)strndup((char *)(_s), (size_t)(_n))

/*
 * Return a pointer to the first byte equal to 'c' in the range
 * [p, last), or NULL if the range does not contain it.
 */
static inline uint8_t *
_vr_strchr(uint8_t *p, uint8_t *last, uint8_t c)
{
    uint8_t *cur;

    for (cur = p; cur < last; cur++) {
        if (*cur == c) {
            return cur;
        }
    }

    return NULL;
}

/*
 * Search backward for the byte 'c', starting at 'p' and going down to
 * 'start' (both inclusive).
 *
 * Returns a pointer to the first match found, i.e. the one closest to
 * 'p', or NULL if there is none or if 'p' is below 'start'.
 */
static inline uint8_t *
_vr_strrchr(uint8_t *p, uint8_t *start, uint8_t c)
{
    while (p >= start) {
        if (*p == c) {
            return p;
        }
        /*
         * Stop before stepping below 'start': forming a pointer to before
         * the beginning of an array is undefined behavior.
         */
        if (p == start) {
            break;
        }
        p--;
    }

    return NULL;
}

void memrev16(void *p);
void memrev32(void *p);
void memrev64(void *p);
uint16_t intrev16(uint16_t v);
uint32_t intrev32(uint32_t v);
uint64_t intrev64(uint64_t v);

/* Variants of the functions above that do the actual conversion only if
 * the target host is big endian.
 *
 * When VR_LITTLE_ENDIAN is defined the memrevNNifbe() macros expand to
 * nothing and the intrevNNifbe() macros expand to their argument;
 * otherwise they forward to memrevNN() / intrevNN(). */
#ifdef VR_LITTLE_ENDIAN
#define memrev16ifbe(p)
#define memrev32ifbe(p)
#define memrev64ifbe(p)
#define intrev16ifbe(v) (v)
#define intrev32ifbe(v) (v)
#define intrev64ifbe(v) (v)
#else
#define memrev16ifbe(p) memrev16(p)
#define memrev32ifbe(p) memrev32(p)
#define memrev64ifbe(p) memrev64(p)
#define intrev16ifbe(v) intrev16(v)
#define intrev32ifbe(v) intrev32(v)
#define intrev64ifbe(v) intrev64(v)
#endif

long long memtoll(const char *p, int *err);
void bytesToHuman(char *s, unsigned long long n);

sds getAbsolutePath(char *filename);

#endif


================================================
FILE: src/vr_worker.c
================================================
#include <vr_core.h>

/* Which thread we assigned a connection to most recently.
 * Starts at -1 so that the first connection goes to worker 0. */
static int last_worker_thread = -1;
/* Number of workers; set by workers_init() from the 'workers' array. */
static int num_worker_threads;

/* Array of vr_worker, one element per worker thread. */
struct darray workers;

static void *worker_thread_run(void *args);

/* Number of connswapunit structs allocated at once by csui_new(). */
#define SU_PER_ALLOC 64

/* Free list of swapunit structs, linked through their 'next' field.
 * Every access is made while holding csui_freelist_lock. */
static struct connswapunit *csui_freelist;
static pthread_mutex_t csui_freelist_lock;

/*
 * Hand out a connswapunit.
 *
 * The unit comes from the free list when that is not empty. Otherwise a
 * batch of SU_PER_ALLOC units is allocated: the first one is returned
 * and the others are put on the free list.
 *
 * Returns NULL if the batch cannot be allocated. The fields of the
 * returned unit are not initialized.
 */
struct connswapunit *
csui_new(void) {
    struct connswapunit *unit;
    struct connswapunit *batch;
    int idx;

    /* Fast path: take the head of the free list. */
    pthread_mutex_lock(&csui_freelist_lock);
    unit = csui_freelist;
    if (unit != NULL) {
        csui_freelist = unit->next;
    }
    pthread_mutex_unlock(&csui_freelist_lock);

    if (unit != NULL) {
        return unit;
    }

    /* Allocate a bunch of units at once to reduce fragmentation */
    batch = dalloc(sizeof(struct connswapunit) * SU_PER_ALLOC);
    if (batch == NULL) {
        return NULL;
    }

    /*
     * Chain batch[1] .. batch[SU_PER_ALLOC - 1] together; batch[0] is
     * the unit handed back to the caller and stays out of the chain.
     */
    for (idx = 1; idx < SU_PER_ALLOC - 1; idx++) {
        batch[idx].next = &batch[idx + 1];
    }

    /* Put the chain in front of whatever is on the free list now. */
    pthread_mutex_lock(&csui_freelist_lock);
    batch[SU_PER_ALLOC - 1].next = csui_freelist;
    csui_freelist = &batch[1];
    pthread_mutex_unlock(&csui_freelist_lock);

    return batch;
}

/*
 * Give a connswapunit back: the unit is not released to the allocator,
 * it becomes the new head of the free list.
 */
void
csui_free(struct connswapunit *item)
{
    pthread_mutex_lock(&csui_freelist_lock);

    item->next = csui_freelist;
    csui_freelist = item;

    pthread_mutex_unlock(&csui_freelist_lock);
}

/*
 * Add the swap unit 'su' to the swap unit list of 'worker', holding the
 * list lock for the duration of the insertion.
 */
void
csul_push(vr_worker *worker, struct connswapunit *su)
{
    pthread_mutex_t *guard = &worker->csullock;

    pthread_mutex_lock(guard);
    dlistPush(worker->csul, su);
    pthread_mutex_unlock(guard);
}

/*
 * Take one swap unit off the swap unit list of 'worker', holding the
 * list lock for the duration of the removal.
 *
 * Returns whatever dlistPop() returns; callers treat NULL as "nothing
 * queued".
 */
struct connswapunit *
csul_pop(vr_worker *worker)
{
    pthread_mutex_t *guard = &worker->csullock;
    struct connswapunit *unit;

    pthread_mutex_lock(guard);
    unit = dlistPop(worker->csul);
    pthread_mutex_unlock(guard);

    return unit;
}

/*
 * Initialize 'worker': reset its fields, set up its event loop (sized
 * from the configured maximum number of clients), create the non
 * blocking socket pair used to notify the worker and create its swap
 * unit list.
 *
 * Returns VR_OK on success, VR_ENOMEM if the swap unit list cannot be
 * created and VR_ERROR on any other failure, including a NULL 'worker'.
 * When a failure happens after the socket pair was created, both
 * descriptors are closed and reset to -1 before returning.
 *
 * NOTE(review): the event loop and the command stats table are not
 * released on the failure paths -- presumably the caller is expected to
 * call vr_worker_deinit(); confirm.
 */
int
vr_worker_init(vr_worker *worker)
{
    rstatus_t status;
    int maxclients;
    int filelimit;
    int ret = VR_ERROR;

    if (worker == NULL) {
        return VR_ERROR;
    }

    worker->id = 0;
    worker->socketpairs[0] = -1;
    worker->socketpairs[1] = -1;
    worker->csul = NULL;
    pthread_mutex_init(&worker->csullock, NULL);
    worker->current_db = 0;
    worker->timelimit_exit = 0;
    worker->last_fast_cycle = 0;
    worker->resize_db = 0;
    worker->rehash_db = 0;

    conf_server_get(CONFIG_SOPN_MAXCLIENTS,&maxclients);
    filelimit = adjustOpenFilesLimit(maxclients);
    if (filelimit <= 0) {
        return VR_ERROR;
    }
    vr_eventloop_init(&worker->vel, filelimit);
    worker->vel.thread.fun_run = worker_thread_run;
    worker->vel.thread.data = worker;
    worker->vel.cstable = commandStatsTableCreate();

    status = socketpair(AF_LOCAL, SOCK_STREAM, 0, worker->socketpairs);
    if (status < 0) {
        log_error("create socketpairs failed: %s", strerror(errno));
        return VR_ERROR;
    }

    status = vr_set_nonblocking(worker->socketpairs[0]);
    if (status < 0) {
        log_error("set socketpairs[0] %d nonblocking failed: %s",
            worker->socketpairs[0], strerror(errno));
        goto error;
    }

    status = vr_set_nonblocking(worker->socketpairs[1]);
    if (status < 0) {
        log_error("set socketpairs[1] %d nonblocking failed: %s",
            worker->socketpairs[1], strerror(errno));
        goto error;
    }

    worker->csul = dlistCreate();
    if (worker->csul == NULL) {
        log_error("create list failed: out of memory");
        ret = VR_ENOMEM;
        goto error;
    }

    return VR_OK;

error:
    /* Do not leak the socket pair created above. */
    close(worker->socketpairs[0]);
    worker->socketpairs[0] = -1;
    close(worker->socketpairs[1]);
    worker->socketpairs[1] = -1;

    return ret;
}

/*
 * Release what vr_worker_init() set up for 'worker': the event loop, the
 * two socket pair descriptors and the swap unit list. A NULL 'worker' is
 * ignored.
 *
 * Descriptors and list are reset to -1 / NULL once released.
 */
void
vr_worker_deinit(vr_worker *worker)
{
    int i;

    if (worker == NULL) {
        return;
    }

    vr_eventloop_deinit(&worker->vel);

    /*
     * vr_worker_init() uses -1 for "no descriptor", so every value from
     * 0 upward is a descriptor to close.
     */
    for (i = 0; i < 2; i++) {
        if (worker->socketpairs[i] >= 0) {
            close(worker->socketpairs[i]);
            worker->socketpairs[i] = -1;
        }
    }

    if (worker->csul != NULL) {
        dlistRelease(worker->csul);
        worker->csul = NULL;
    }
}

/*
 * Return the worker index that follows 'curidx', going back to 0 once
 * the number of workers is reached.
 */
int
worker_get_next_idx(int curidx)
{
    int next = curidx + 1;

    if (next >= num_worker_threads) {
        return 0;
    }
    return next;
}

/*
 * Hand the freshly accepted socket 'sd', accepted on listener 'vlisten',
 * to a worker.
 *
 * Workers are picked in turn. The socket and its listener are queued on
 * the chosen worker's swap unit list, then a 'c' byte is written to the
 * worker's socket pair to notify it. If no swap unit can be obtained
 * the socket is closed.
 */
void
dispatch_conn_new(vr_listen *vlisten, int sd)
{
    char notice[1];
    int tid;
    vr_worker *worker;
    struct connswapunit *unit = csui_new();

    if (unit == NULL) {
        close(sd);
        /* given that malloc failed this may also fail, but let's try */
        log_error("Failed to allocate memory for connection swap object\n");
        return;
    }

    /* Next worker in turn. */
    tid = (last_worker_thread + 1) % num_worker_threads;
    worker = darray_get(&workers, (uint32_t)tid);
    last_worker_thread = tid;

    unit->num = sd;
    unit->data = vlisten;
    csul_push(worker, unit);

    /* Wake the worker up: 'c' stands for a new connection. */
    notice[0] = 'c';
    if (vr_write(worker->socketpairs[0], notice, 1) != 1) {
        log_error("Notice the worker failed.");
    }

    update_curr_clients_add(1);
}

/*
 * Event handler for the worker side of the notification socket pair
 * (socketpairs[1]); 'privdata' is the worker itself.
 *
 * One command byte is read from 'fd' and one swap unit is popped from
 * the worker's list accordingly:
 *   'c'  the unit carries a new socket (num) and its listener (data): a
 *        conn and a client are created for it and the socket is
 *        registered for reading on this worker's event loop.
 *   'j'  the unit carries an existing client (data) that is moved to
 *        this worker: its pending command is executed here and the
 *        client is either dispatched again or linked to this event loop.
 * Any other byte is logged and ignored.
 */
static void
thread_event_process(aeEventLoop *el, int fd, void *privdata, int mask) {

    rstatus_t status;
    vr_worker *worker = privdata;
    char buf[1];
    int sd;
    vr_listen *vlisten;
    struct conn *conn;
    struct connswapunit *csu;
    client *c;

    ASSERT(el == worker->vel.el);
    ASSERT(fd == worker->socketpairs[1]);

    /* A failed read is not fatal: it is handled as a 'c' notification. */
    if (vr_read(fd, buf, 1) != 1) {
        log_warn("Can't read for worker(id:%d) socketpairs[1](%d)", 
            worker->vel.thread.id, fd);
        buf[0] = 'c';
    }
    
    switch (buf[0]) {
    case 'c':
        /* New connection: nothing to do if the list is empty. */
        csu = csul_pop(worker);
        if (csu == NULL) {
            return;
        }
        sd = csu->num;
        vlisten = csu->data;
        /* The unit is only a carrier: recycle it right away. */
        csui_free(csu);
        conn = conn_get(worker->vel.cb);
        if (conn == NULL) {
            log_error("get conn for c %d failed: %s", 
                sd, strerror(errno));
            status = close(sd);
            if (status < 0) {
                log_error("close c %d failed, ignored: %s", sd, strerror(errno));
            }
            return;
        }
        conn->sd = sd;
    
        status = vr_set_nonblocking(conn->sd);
        if (status < 0) {
            log_error("set nonblock on c %d failed: %s", 
                conn->sd, strerror(errno));
            /* NOTE(review): presumably conn_put() also closes conn->sd;
             * verify, otherwise the socket leaks here. */
            conn_put(conn);
            return;
        }
    
        /* TCP_NODELAY only makes sense for internet sockets. */
        if (vlisten->info.family == AF_INET || vlisten->info.family == AF_INET6) {
            status = vr_set_tcpnodelay(conn->sd);
            if (status < 0) {
                log_warn("set tcpnodelay on c %d failed, ignored: %s",
                    conn->sd, strerror(errno));
            }
        }

        c = createClient(&worker->vel, conn);
        if (c == NULL) {
            log_error("Create client failed");
            conn_put(conn);
            return;
        }
        c->curidx = worker->id;
        status = aeCreateFileEvent(worker->vel.el, conn->sd, AE_READABLE, 
            readQueryFromClient, c);
        if (status == AE_ERR) {
            /* NOTE(review): returns without releasing 'c' or 'conn' --
             * looks like a leak; confirm. */
            log_error("Unrecoverable error creating worker ipfd file event.");
            return;
        }

        update_stats_add(c->vel->stats, numconnections, 1);
        
        break;
    case 'j':
        /* A client jumping in from another worker. */
        csu = csul_pop(worker);
        if (csu == NULL) {
            return;
        }
        c = csu->data;
        csui_free(csu);
        /* From now on the client belongs to this worker. */
        c->vel = &worker->vel;
        c->curidx = worker->id;
        c->steps ++;
        c->cmd->proc(c);
        
        /* The command may ask for yet another jump, to worker c->taridx. */
        if (c->flags&CLIENT_JUMP) {
            dispatch_conn_exist(c,c->taridx);
        } else {
            resetClient(c);
            linkClientToEventloop(c,c->vel);
        }
        break;
    default:
        log_error("read error char '%c' for worker(id:%d) socketpairs[1](%d)", 
            buf[0], worker->vel.thread.id, worker->socketpairs[1]);
        break;
    }
}

/*
 * Wire 'worker' into its event loop: watch the worker side of the
 * notification socket pair, install the before-sleep hook and create
 * the cron time event.
 *
 * Returns VR_OK on success, VR_ERROR if an event cannot be created.
 */
static int
setup_worker(vr_worker *worker)
{
    rstatus_t status;

    /* Notifications arrive on socketpairs[1]. */
    status = aeCreateFileEvent(worker->vel.el, worker->socketpairs[1],
        AE_READABLE, thread_event_process, worker);
    if (status == AE_ERR) {
        log_error("Unrecoverable error creating worker ipfd file event.");
        return VR_ERROR;
    }

    aeSetBeforeSleepProc(worker->vel.el, worker_before_sleep, worker);

    /* worker_cron() is the main way to process background operations. */
    if (aeCreateTimeEvent(worker->vel.el, 1, worker_cron, worker, NULL)
        == AE_ERR)
    {
        serverPanic("Can't create the serverCron time event.");
        return VR_ERROR;
    }

    return VR_OK;
}

/*
 * Thread entry point of a worker: 'args' is the vr_worker, whose event
 * loop is run until aeMain() returns. Always returns NULL.
 */
static void *
worker_thread_run(void *args)
{
    vr_worker *self = args;

    aeMain(self->vel.el);

    return NULL;
}

/*
 * Create and set up 'worker_count' workers in the global 'workers'
 * array, and initialize the swap unit free list.
 *
 * A worker that cannot be initialized or set up is fatal: the process
 * exits with status 1. Returns VR_OK otherwise.
 */
int
workers_init(uint32_t worker_count)
{
    rstatus_t status;
    uint32_t idx;
    vr_worker *worker;

    csui_freelist = NULL;
    pthread_mutex_init(&csui_freelist_lock, NULL);

    darray_init(&workers, worker_count, sizeof(vr_worker));

    for (idx = 0; idx < worker_count; idx ++) {
        worker = darray_push(&workers);
        /*
         * Do not go on with a worker that failed to initialize:
         * setup_worker() would use its event loop and socket pair.
         * vr_worker_init() also rejects a NULL worker.
         */
        status = vr_worker_init(worker);
        if (status != VR_OK) {
            log_error("init worker %u failed", idx);
            exit(1);
        }
        /* vr_worker_init() resets the id to 0: assign it afterwards. */
        worker->id = idx;
        status = setup_worker(worker);
        if (status != VR_OK) {
            exit(1);
        }
    }

    num_worker_threads = (int)darray_n(&workers);

    return VR_OK;
}

int
workers_run(void)
{
    uint32_t i, thread_count;
    vr_worker *worker;

    thread_count = (uint32_t)num_worker_threads;

    for (i = 0; i < thread_count; i ++) {
        worker = darray_get(&workers, i);
        vr_thread_start(&worker->vel.thread);
    }

    return VR_OK;
}

int
workers_wait(void)
{
    uint32_t i, thread_count;
    vr_worker *worker;

    thread_count = (uint32_t)num_worker_threads;

    for (i = 0; i < thread_count; i ++) {
        worker = darray_get(&workers, i);
        pthread_join(worker->vel.thread.thread_id, NULL);
    }

    return VR_OK;
}

void
workers_deinit(void)
{
    vr_worker *worker;

    while(darray_n(&workers)) {
        worker = darray_pop(&workers);
		vr_worker_deinit(worker);
    }
}

/* Before-sleep hook of a worker event loop: it is installed with
 * aeSetBeforeSleepProc() and receives the worker as 'private_data'.
 *
 * It handles the clients of this worker that have pending output. */
void
worker_before_sleep(struct aeEventLoop *eventLoop, void *private_data) {
    vr_worker *self = private_data;

    UNUSED(eventLoop);
    UNUSED(private_data);

    ASSERT(eventLoop == self->vel.el);

    /* Handle writes with pending output buffers. */
    handleClientsWithPendingWrites(&self->vel);

    /* The fast expire cycle is currently disabled here:
     * activeExpireCycle(worker, ACTIVE_EXPIRE_CYCLE_FAST); */
}

/*
 * Time event of a worker; 'clientData' is the worker.
 *
 * Each run refreshes the cached time of the event loop, samples the
 * command and network counters (period 100), samples the resident set
 * size and refreshes the config cache (period 1000), and frees the
 * clients queued for asynchronous release.
 *
 * Returns 1000/hz, which is handed back to the event loop.
 */
int
worker_cron(struct aeEventLoop *eventLoop, long long id, void *clientData) {
    vr_worker *self = clientData;
    vr_eventloop *loop = &self->vel;
    size_t stat_used_memory, stats_peak_memory;

    UNUSED(eventLoop);
    UNUSED(id);
    UNUSED(clientData);

    ASSERT(eventLoop == loop->el);

    /* Cached time. */
    loop->unixtime = time(NULL);
    loop->mstime = vr_msec_now();

    run_with_period(100, loop->cronloops) {
        long long sample;

        update_stats_get(loop->stats,numcommands,&sample);
        trackInstantaneousMetric(loop->stats,STATS_METRIC_COMMAND,sample);

        update_stats_get(loop->stats,net_input_bytes,&sample);
        trackInstantaneousMetric(loop->stats,STATS_METRIC_NET_INPUT,sample);

        update_stats_get(loop->stats,net_output_bytes,&sample);
        trackInstantaneousMetric(loop->stats,STATS_METRIC_NET_OUTPUT,sample);
    }

    /* Sample the RSS here since this is a relatively slow call. */
    run_with_period(1000, loop->cronloops) {
        loop->resident_set_size = dalloc_get_rss();
    }

    /* Peak memory tracking is currently disabled:
    stat_used_memory = dalloc_used_memory();
    update_stats_get(vel->stats, peak_memory, &stats_peak_memory);
    if (stat_used_memory > stats_peak_memory) {
        update_stats_set(vel->stats, peak_memory, stat_used_memory);
    }*/

    /* Close clients that need to be closed asynchronous */
    freeClientsInAsyncFreeQueue(loop);

    /* databasesCron(worker) is currently disabled. */

    /* Update the config cache */
    run_with_period(1000, loop->cronloops) {
        conf_cache_update(&loop->cc);
    }

    loop->cronloops ++;
    return 1000/loop->hz;
}


================================================
FILE: src/vr_worker.h
================================================
#ifndef _VR_WORKER_H_
#define _VR_WORKER_H_

/* Per-worker state: the worker's own event loop plus the bookkeeping used
 * to hand connections over to it and to run incremental background jobs. */
typedef struct vr_worker {

    int id;                     /* Worker identifier. */
    vr_eventloop vel;           /* Event loop state owned by this worker. */
    
    int socketpairs[2];         /* 0: belongs to the master thread, 1: belongs to this worker */
    
    dlist *csul;    /* Connect swap unit list */
    pthread_mutex_t csullock;   /* Lock for the swap unit list */

    /* Some global state in order to continue the work incrementally
     * across calls of activeExpireCycle() to expire some keys. */
    unsigned int current_db;    /* Last DB tested. */
    int timelimit_exit;         /* Time limit hit in previous call? */
    long long last_fast_cycle;  /* When last fast cycle ran. */

    /* We use global counters so if we stop the computation at a given
     * DB we'll be able to start from the successive one in the next
     * cron loop iteration of databasesCron() to resize and rehash the db. */
    unsigned int resize_db;
    unsigned int rehash_db;
}vr_worker;

/* Connection swap unit: the item type pushed to and popped from a worker's
 * swap unit list (see csul_push()/csul_pop()).
 * NOTE(review): the exact meaning of 'num' and 'data' is set by the
 * producers, which are not visible here -- confirm against the callers. */
struct connswapunit {
    int num;                    /* Integer payload of the unit. */
    void *data;                 /* Opaque pointer payload of the unit. */
    struct connswapunit *next;  /* Link to another unit. */
};

/* Global worker array, defined in another translation unit (presumably it
 * holds the vr_worker instances -- confirm in vr_worker.c). */
extern struct darray workers;

/* Worker pool lifecycle. */
int workers_init(uint32_t worker_count);
int workers_run(void);
int workers_wait(void);
void workers_deinit(void);

/* Allocation and release of connection swap units. */
struct connswapunit *csui_new(void);
void csui_free(struct connswapunit *item);

/* Push/pop a swap unit on the swap unit list of 'worker'. */
void csul_push(vr_worker *worker, struct connswapunit *su);
struct connswapunit *csul_pop(vr_worker *worker);

int worker_get_next_idx(int curidx);

void dispatch_conn_new(vr_listen *vlisten, int sd);

/* Event loop hooks of a worker: worker_before_sleep() flushes pending
 * client output, worker_cron() is the periodic timer callback and returns
 * 1000/hz. */
void worker_before_sleep(struct aeEventLoop *eventLoop, void *private_data);
int worker_cron(struct aeEventLoop *eventLoop, long long id, void *clientData);

#endif


================================================
FILE: src/vr_ziplist.c
================================================
/* The ziplist is a specially encoded dually linked list that is designed
 * to be very memory efficient. It stores both strings and integer values,
 * where integers are encoded as actual integers instead of a series of
 * characters. It allows push and pop operations on either side of the list
 * in O(1) time. However, because every operation requires a reallocation of
 * the memory used by the ziplist, the actual complexity is related to the
 * amount of memory used by the ziplist.
 *
 * ----------------------------------------------------------------------------
 *
 * ZIPLIST OVERALL LAYOUT:
 * The general layout of the ziplist is as follows:
 * <zlbytes><zltail><zllen><entry><entry><zlend>
 *
 * <zlbytes> is an unsigned integer to hold the number of bytes that the
 * ziplist occupies. This value needs to be stored to be able to resize the
 * entire structure without the need to traverse it first.
 *
 * <zltail> is the offset to the last entry in the list. This allows a pop
 * operation on the far side of the list without the need for full traversal.
 *
 * <zllen> is the number of entries. When this value is larger than 2**16-2,
 * we need to traverse the entire list to know how many items it holds.
 *
 * <zlend> is a single byte special value, equal to 255, which indicates the
 * end of the list.
 *
 * ZIPLIST ENTRIES:
 * Every entry in the ziplist is prefixed by a header that contains two pieces
 * of information. First, the length of the previous entry is stored to be
 * able to traverse the list from back to front. Second, the encoding with an
 * optional string length of the entry itself is stored.
 *
 * The length of the previous entry is encoded in the following way:
 * If this length is smaller than 254 bytes, it will only consume a single
 * byte that takes the length as value. When the length is greater than or
 * equal to 254, it will consume 5 bytes. The first byte is set to 254 to
 * indicate a larger value is following. The remaining 4 bytes take the
 * length of the previous entry as value.
 *
 * The other header field of the entry itself depends on the contents of the
 * entry. When the entry is a string, the first 2 bits of this header will hold
 * the type of encoding used to store the length of the string, followed by the
 * actual length of the string. When the entry is an integer the first 2 bits
 * are both set to 1. The following 2 bits are used to specify what kind of
 * integer will be stored after this header. An overview of the different
 * types and encodings is as follows:
 *
 * |00pppppp| - 1 byte
 *      String value with length less than or equal to 63 bytes (6 bits).
 * |01pppppp|qqqqqqqq| - 2 bytes
 *      String value with length less than or equal to 16383 bytes (14 bits).
 * |10______|qqqqqqqq|rrrrrrrr|ssssssss|tttttttt| - 5 bytes
 *      String value with length greater than or equal to 16384 bytes.
 * |11000000| - 1 byte
 *      Integer encoded as int16_t (2 bytes).
 * |11010000| - 1 byte
 *      Integer encoded as int32_t (4 bytes).
 * |11100000| - 1 byte
 *      Integer encoded as int64_t (8 bytes).
 * |11110000| - 1 byte
 *      Integer encoded as 24 bit signed (3 bytes).
 * |11111110| - 1 byte
 *      Integer encoded as 8 bit signed (1 byte).
 * |1111xxxx| - (with xxxx between 0000 and 1101) immediate 4 bit integer.
 *      Unsigned integer from 0 to 12. The encoded value is actually from
 *      1 to 13 because 0000 and 1111 can not be used, so 1 should be
 *      subtracted from the encoded 4 bit value to obtain the right value.
 * |11111111| - End of ziplist.
 *
 * All the integers are represented in little endian byte order.
 *
 * ----------------------------------------------------------------------------
 *
 * Copyright (c) 2009-2012, Pieter Noordhuis <pcnoordhuis at gmail dot com>
 * Copyright (c) 2009-2012, Salvatore Sanfilippo <antirez at gmail dot com>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *   * Redistributions of source code must retain the above copyright notice,
 *     this list of conditions and the following disclaimer.
 *   * Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *   * Neither the name of Redis nor the names of its contributors may be used
 *     to endorse or promote products derived from this software without
 *     specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <stdint.h>
#include <limits.h>

#include <vr_core.h>

/* Special byte values: ZIP_END terminates the ziplist, ZIP_BIGLEN as first
 * byte of a "prevlen" field selects the 5-byte form of that field. */
#define ZIP_END 255
#define ZIP_BIGLEN 254

/* Different encoding/length possibilities */
#define ZIP_STR_MASK 0xc0
#define ZIP_INT_MASK 0x30
#define ZIP_STR_06B (0 << 6)
#define ZIP_STR_14B (1 << 6)
#define ZIP_STR_32B (2 << 6)
#define ZIP_INT_16B (0xc0 | 0<<4)
#define ZIP_INT_32B (0xc0 | 1<<4)
#define ZIP_INT_64B (0xc0 | 2<<4)
#define ZIP_INT_24B (0xc0 | 3<<4)
#define ZIP_INT_8B 0xfe
/* 4 bit integer immediate encoding */
#define ZIP_INT_IMM_MASK 0x0f
#define ZIP_INT_IMM_MIN 0xf1    /* 11110001 */
#define ZIP_INT_IMM_MAX 0xfd    /* 11111101 */
/* The argument is parenthesized so that expressions such as 'a|b' are
 * masked as a whole. */
#define ZIP_INT_IMM_VAL(v) ((v) & ZIP_INT_IMM_MASK)

#define INT24_MAX 0x7fffff
#define INT24_MIN (-INT24_MAX - 1)

/* Macro to determine type: an encoding byte whose two top bits are not both
 * set describes a string. */
#define ZIP_IS_STR(enc) (((enc) & ZIP_STR_MASK) < ZIP_STR_MASK)

/* Utility macros: accessors for the ziplist header fields and pointers to
 * the first entry, the last entry and the end marker. The header fields are
 * accessed raw; callers convert them with intrev32ifbe()/intrev16ifbe(). */
#define ZIPLIST_BYTES(zl)       (*((uint32_t*)(zl)))
#define ZIPLIST_TAIL_OFFSET(zl) (*((uint32_t*)((zl)+sizeof(uint32_t))))
#define ZIPLIST_LENGTH(zl)      (*((uint16_t*)((zl)+sizeof(uint32_t)*2)))
#define ZIPLIST_HEADER_SIZE     (sizeof(uint32_t)*2+sizeof(uint16_t))
#define ZIPLIST_END_SIZE        (sizeof(uint8_t))
#define ZIPLIST_ENTRY_HEAD(zl)  ((zl)+ZIPLIST_HEADER_SIZE)
#define ZIPLIST_ENTRY_TAIL(zl)  ((zl)+intrev32ifbe(ZIPLIST_TAIL_OFFSET(zl)))
#define ZIPLIST_ENTRY_END(zl)   ((zl)+intrev32ifbe(ZIPLIST_BYTES(zl))-1)

/* We know a positive increment can only be 1 because entries can only be
 * pushed one at a time. Once the stored length has reached UINT16_MAX it is
 * no longer updated. 'incr' is parenthesized so that any expression can be
 * passed safely. */
#define ZIPLIST_INCR_LENGTH(zl,incr) { \
    if (ZIPLIST_LENGTH(zl) < UINT16_MAX) \
        ZIPLIST_LENGTH(zl) = intrev16ifbe(intrev16ifbe(ZIPLIST_LENGTH(zl))+(incr)); \
}

typedef struct zlentry {
    unsigned int prevrawlensize, prevrawlen;
    unsigned int lensize, len;
    unsigned int headersize;
    unsigned char encoding;
    unsigned char *p;
} zlentry;

/* Reset every field of the zlentry pointed to by 'zle' to zero / NULL. */
#define ZIPLIST_ENTRY_ZERO(zle) { \
    (zle)->prevrawlensize = (zle)->prevrawlen = 0; \
    (zle)->lensize = (zle)->len = (zle)->headersize = 0; \
    (zle)->encoding = 0; \
    (zle)->p = NULL; \
}

/* Extract the encoding from the byte pointed by 'ptr' and set it into
 * 'encoding'. For string encodings only the two type bits are kept, since
 * the remaining bits of the byte are part of the string length.
 *
 * 'ptr' is parenthesized before being indexed so that pointer expressions
 * such as 'p + n' are dereferenced as a whole. */
#define ZIP_ENTRY_ENCODING(ptr, encoding) do {  \
    (encoding) = ((ptr)[0]); \
    if ((encoding) < ZIP_STR_MASK) (encoding) &= ZIP_STR_MASK; \
} while(0)

void ziplistRepr(unsigned char *zl);

/* Number of payload bytes used by an integer stored with 'encoding'.
 * Every encoding that is not one of the fixed size ones (this includes the
 * 4 bit immediate encodings) has no payload and yields 0. */
static unsigned int zipIntSize(unsigned char encoding) {
    if (encoding == ZIP_INT_8B)  return 1;
    if (encoding == ZIP_INT_16B) return 2;
    if (encoding == ZIP_INT_24B) return 3;
    if (encoding == ZIP_INT_32B) return 4;
    if (encoding == ZIP_INT_64B) return 8;
    return 0; /* 4 bit immediate */
}

/* Build the encoding/length header of an entry and, when 'p' is not NULL,
 * store it at 'p'. The number of header bytes is returned in both cases, so
 * passing NULL is the way to just ask for the size.
 *
 * For strings the header form is picked from 'rawlen' (the encoding given
 * by the caller may not be set); for integers the header is the single
 * 'encoding' byte. */
static unsigned int zipEncodeLength(unsigned char *p, unsigned char encoding, unsigned int rawlen) {
    unsigned char hdr[5];
    unsigned int hdrlen;

    if (!ZIP_IS_STR(encoding)) {
        /* Integer: the encoding byte is the whole header. */
        hdrlen = 1;
        hdr[0] = encoding;
    } else if (rawlen <= 0x3f) {
        /* 6 bit string length. */
        hdrlen = 1;
        hdr[0] = ZIP_STR_06B | rawlen;
    } else if (rawlen <= 0x3fff) {
        /* 14 bit string length, most significant bits first. */
        hdrlen = 2;
        hdr[0] = ZIP_STR_14B | ((rawlen >> 8) & 0x3f);
        hdr[1] = rawlen & 0xff;
    } else {
        /* 32 bit string length, most significant byte first. */
        hdrlen = 5;
        hdr[0] = ZIP_STR_32B;
        hdr[1] = (rawlen >> 24) & 0xff;
        hdr[2] = (rawlen >> 16) & 0xff;
        hdr[3] = (rawlen >> 8) & 0xff;
        hdr[4] = rawlen & 0xff;
    }

    if (p != NULL) memcpy(p,hdr,hdrlen);
    return hdrlen;
}

/* Decode the length encoded in 'ptr'. The 'encoding' variable will hold the
 * entries encoding, the 'lensize' variable will hold the number of bytes
 * required to encode the entries length, and the 'len' variable will hold the
 * entries length.
 *
 * The bytes of the 32 bit string length are widened to uint32_t before being
 * shifted: an unsigned char promotes to (signed) int, and shifting a value
 * >= 0x80 left by 24 bits would overflow it.
 *
 * NOTE(review): the ';' after 'while(0)' is kept on purpose, since call
 * sites outside of this view cannot be checked; it makes the macro unsafe
 * as the body of an unbraced if/else. */
#define ZIP_DECODE_LENGTH(ptr, encoding, lensize, len) do {                    \
    ZIP_ENTRY_ENCODING((ptr), (encoding));                                     \
    if ((encoding) < ZIP_STR_MASK) {                                           \
        if ((encoding) == ZIP_STR_06B) {                                       \
            (lensize) = 1;                                                     \
            (len) = (ptr)[0] & 0x3f;                                           \
        } else if ((encoding) == ZIP_STR_14B) {                                \
            (lensize) = 2;                                                     \
            (len) = (((ptr)[0] & 0x3f) << 8) | (ptr)[1];                       \
        } else if ((encoding) == ZIP_STR_32B) {                                \
            (lensize) = 5;                                                     \
            (len) = ((uint32_t)(ptr)[1] << 24) |                               \
                    ((uint32_t)(ptr)[2] << 16) |                               \
                    ((uint32_t)(ptr)[3] <<  8) |                               \
                    ((uint32_t)(ptr)[4]);                                      \
        } else {                                                               \
            ASSERT(NULL);                                                      \
        }                                                                      \
    } else {                                                                   \
        (lensize) = 1;                                                         \
        (len) = zipIntSize((encoding));                                        \
    }                                                                          \
} while(0);

/* Store 'len', the length of the previous entry, in the "prevlen" field at
 * 'p' and return the number of bytes the field takes: a single byte for
 * lengths below ZIP_BIGLEN, otherwise the ZIP_BIGLEN marker followed by the
 * length itself. With 'p' set to NULL nothing is written and only the size
 * is returned. */
static unsigned int zipPrevEncodeLength(unsigned char *p, unsigned int len) {
    unsigned int fieldsize = (len < ZIP_BIGLEN) ? 1 : 1+sizeof(len);

    if (p == NULL) return fieldsize;

    if (fieldsize == 1) {
        p[0] = len;
        return fieldsize;
    }

    p[0] = ZIP_BIGLEN;
    memcpy(p+1,&len,sizeof(len));
    memrev32ifbe(p+1);
    return fieldsize;
}

/* Like zipPrevEncodeLength() but always writes the large form of the field
 * (ZIP_BIGLEN marker plus the length), whatever the value of 'len' is.
 * Required in __ziplistCascadeUpdate. A NULL 'p' is a no-op. */
static void zipPrevEncodeLengthForceLarge(unsigned char *p, unsigned int len) {
    if (p != NULL) {
        unsigned char *lenbytes = p+1;

        p[0] = ZIP_BIGLEN;
        memcpy(lenbytes,&len,sizeof(len));
        memrev32ifbe(lenbytes);
    }
}

/* Decode the number of bytes required to store the length of the previous
 * element, from the perspective of the entry pointed to by 'ptr': 1 when the
 * first byte is below ZIP_BIGLEN, 5 otherwise. The result is stored in
 * 'prevlensize'.
 * NOTE(review): the expansion ends with "while(0);", so the macro already
 * carries its own ';' and is not safe as the body of an unbraced if/else. */
#define ZIP_DECODE_PREVLENSIZE(ptr, prevlensize) do {                          \
    if ((ptr)[0] < ZIP_BIGLEN) {                                               \
        (prevlensize) = 1;                                                     \
    } else {                                                                   \
        (prevlensize) = 5;                                                     \
    }                                                                          \
} while(0);

/* Decode the length of the previous element, from the perspective of the entry
 * pointed to by 'ptr'. 'prevlensize' receives the size of the prevlen field
 * (1 or 5 bytes) and 'prevlen' the decoded length.
 *
 * In the 5 byte form the four bytes following the ZIP_BIGLEN marker are
 * copied straight into 'prevlen', so it is 'prevlen' (the memcpy
 * destination) that must be a 4 byte object: that is what the ASSERT
 * verifies.
 *
 * NOTE(review): the ';' after 'while(0)' is kept on purpose, since call
 * sites outside of this view cannot be checked. */
#define ZIP_DECODE_PREVLEN(ptr, prevlensize, prevlen) do {                     \
    ZIP_DECODE_PREVLENSIZE(ptr, prevlensize);                                  \
    if ((prevlensize) == 1) {                                                  \
        (prevlen) = (ptr)[0];                                                  \
    } else if ((prevlensize) == 5) {                                           \
        ASSERT(sizeof((prevlen)) == 4);                                        \
        memcpy(&(prevlen), ((char*)(ptr)) + 1, 4);                             \
        memrev32ifbe(&(prevlen));                                              \
    }                                                                          \
} while(0);

/* How many more (positive) or fewer (negative) bytes the "prevlen" field of
 * the entry at 'p' would need in order to store 'len', compared to the size
 * the field has right now. */
static int zipPrevLenByteDiff(unsigned char *p, unsigned int len) {
    unsigned int cursize;
    unsigned int needed = zipPrevEncodeLength(NULL, len);

    ZIP_DECODE_PREVLENSIZE(p, cursize);
    return needed - cursize;
}

/* Total size in bytes of the entry starting at 'p': prevlen field, plus
 * encoding/length field, plus payload. */
static unsigned int zipRawEntryLength(unsigned char *p) {
    unsigned int prevfield, enc, lenfield, payload;
    unsigned int total;

    ZIP_DECODE_PREVLENSIZE(p, prevfield);
    ZIP_DECODE_LENGTH(p + prevfield, enc, lenfield, payload);

    total = prevfield + lenfield + payload;
    return total;
}

/* Try to represent the string 'entry' (of 'entrylen' bytes) as an integer.
 * On success 1 is returned, the smallest suitable integer encoding is
 * stored in '*encoding' and the value in '*v'. Otherwise 0 is returned and
 * both outputs are left untouched. */
static int zipTryEncoding(unsigned char *entry, unsigned int entrylen, long long *v, unsigned char *encoding) {
    long long num;
    unsigned char enc;

    /* Empty strings and strings of 32 or more bytes are never converted. */
    if (entrylen == 0 || entrylen >= 32) return 0;
    if (!string2ll((char*)entry,entrylen,&num)) return 0;

    /* Pick the smallest encoding able to hold the value. */
    if (num >= 0 && num <= 12)
        enc = ZIP_INT_IMM_MIN+num;
    else if (num >= INT8_MIN && num <= INT8_MAX)
        enc = ZIP_INT_8B;
    else if (num >= INT16_MIN && num <= INT16_MAX)
        enc = ZIP_INT_16B;
    else if (num >= INT24_MIN && num <= INT24_MAX)
        enc = ZIP_INT_24B;
    else if (num >= INT32_MIN && num <= INT32_MAX)
        enc = ZIP_INT_32B;
    else
        enc = ZIP_INT_64B;

    *encoding = enc;
    *v = num;
    return 1;
}

/* Store integer 'value' at 'p', encoded as 'encoding'.
 *
 * The number of bytes written is the one of the encoding (1, 2, 3, 4 or 8);
 * integers are stored in little endian byte order. Nothing is written for
 * the 4 bit immediate encodings, as the value lives in the encoding byte
 * itself. Any other encoding triggers the ASSERT. */
static void zipSaveInteger(unsigned char *p, int64_t value, unsigned char encoding) {
    int16_t i16;
    int32_t i32;
    int64_t i64;
    if (encoding == ZIP_INT_8B) {
        ((int8_t*)p)[0] = (int8_t)value;
    } else if (encoding == ZIP_INT_16B) {
        i16 = value;
        memcpy(p,&i16,sizeof(i16));
        memrev16ifbe(p);
    } else if (encoding == ZIP_INT_24B) {
        /* The 24 bit value is placed in the upper three bytes of a 32 bit
         * word, and those three bytes are stored. The shift is done on an
         * unsigned type: left shifting a negative signed value is undefined
         * behavior. */
        i32 = ((uint64_t)value)<<8;
        memrev32ifbe(&i32);
        memcpy(p,((uint8_t*)&i32)+1,sizeof(i32)-sizeof(uint8_t));
    } else if (encoding == ZIP_INT_32B) {
        i32 = value;
        memcpy(p,&i32,sizeof(i32));
        memrev32ifbe(p);
    } else if (encoding == ZIP_INT_64B) {
        i64 = value;
        memcpy(p,&i64,sizeof(i64));
        memrev64ifbe(p);
    } else if (encoding >= ZIP_INT_IMM_MIN && encoding <= ZIP_INT_IMM_MAX) {
        /* Nothing to do, the value is stored in the encoding itself. */
    } else {
        ASSERT(NULL);
    }
}

/* Decode and return the integer stored at 'p' with the given 'encoding'.
 * For the 4 bit immediate encodings the value comes from the encoding byte
 * and 'p' is not read. An unknown encoding triggers the ASSERT and yields 0. */
static int64_t zipLoadInteger(unsigned char *p, unsigned char encoding) {
    switch (encoding) {
    case ZIP_INT_8B:
        return ((int8_t*)p)[0];
    case ZIP_INT_16B: {
        int16_t half;
        memcpy(&half,p,sizeof(half));
        memrev16ifbe(&half);
        return half;
    }
    case ZIP_INT_32B: {
        int32_t word;
        memcpy(&word,p,sizeof(word));
        memrev32ifbe(&word);
        return word;
    }
    case ZIP_INT_24B: {
        /* Load the three bytes in the upper part of a 32 bit word, then
         * shift them back down. */
        int32_t word = 0;
        memcpy(((uint8_t*)&word)+1,p,sizeof(word)-sizeof(uint8_t));
        memrev32ifbe(&word);
        return word>>8;
    }
    case ZIP_INT_64B: {
        int64_t quad;
        memcpy(&quad,p,sizeof(quad));
        memrev64ifbe(&quad);
        return quad;
    }
    default:
        break;
    }

    if (encoding >= ZIP_INT_IMM_MIN && encoding <= ZIP_INT_IMM_MAX) {
        /* The stored nibble is the value plus one. */
        return (encoding & ZIP_INT_IMM_MASK)-1;
    }

    ASSERT(NULL);
    return 0;
}

/* Decode the entry starting at 'p' and fill '*e' with all the information
 * about it: prevlen field, encoding/length field, header size and the
 * pointer to the entry itself. */
static void zipEntry(unsigned char *p, zlentry *e) {
    unsigned char *lenfield;

    ZIP_DECODE_PREVLEN(p, e->prevrawlensize, e->prevrawlen);

    /* The encoding/length field comes right after the prevlen field. */
    lenfield = p + e->prevrawlensize;
    ZIP_DECODE_LENGTH(lenfield, e->encoding, e->lensize, e->len);

    e->p = p;
    e->headersize = e->prevrawlensize + e->lensize;
}

/* Allocate and return an empty ziplist: just the header followed by the
 * end marker. The tail offset points right after the header and the entry
 * count is zero. */
unsigned char *ziplistNew(void) {
    unsigned int total = ZIPLIST_HEADER_SIZE+1;
    unsigned char *list = dalloc(total);

    ZIPLIST_LENGTH(list) = 0;
    ZIPLIST_TAIL_OFFSET(list) = intrev32ifbe(ZIPLIST_HEADER_SIZE);
    ZIPLIST_BYTES(list) = intrev32ifbe(total);
    list[total-1] = ZIP_END;
    return list;
}

/* Reallocate the ziplist to 'len' bytes, record the new size in the header
 * and put the end marker in the last byte. The (possibly moved) ziplist is
 * returned; the old pointer must no longer be used. */
static unsigned char *ziplistResize(unsigned char *zl, unsigned int len) {
    unsigned char *resized = drealloc(zl,len);

    ZIPLIST_BYTES(resized) = intrev32ifbe(len);
    resized[len-1] = ZIP_END;
    return resized;
}

/* When an entry is inserted, we need to set the prevlen field of the next
 * entry to equal the length of the inserted entry. It can occur that this
 * length cannot be encoded in 1 byte and the next entry needs to grow
 * a bit larger to hold the 5-byte encoded prevlen. This can be done for free,
 * because this only happens when an entry is already being inserted (which
 * causes a realloc and memmove). However, encoding the prevlen may require
 * that this entry is grown as well. This effect may cascade throughout
 * the ziplist when there are consecutive entries with a size close to
 * ZIP_BIGLEN, so we need to check that the prevlen can be encoded in every
 * consecutive entry.
 *
 * Note that this effect can also happen in reverse, where the bytes required
 * to encode the prevlen field can shrink. This effect is deliberately ignored,
 * because it can cause a "flapping" effect where a chain of prevlen fields is
 * first grown and then shrunk again after consecutive inserts. Rather, the
 * field is allowed to stay larger than necessary, because a large prevlen
 * field implies the ziplist is holding large entries anyway.
 *
 * The pointer "p" points to the first entry that does NOT need to be
 * updated, i.e. consecutive fields MAY need an update.
 *
 * The ziplist may be reallocated: the returned pointer replaces "zl". */
static unsigned char *__ziplistCascadeUpdate(unsigned char *zl, unsigned char *p) {
    size_t curlen = intrev32ifbe(ZIPLIST_BYTES(zl)), rawlen, rawlensize;
    size_t offset, noffset, extra;
    unsigned char *np;
    zlentry cur, next;

    while (p[0] != ZIP_END) {
        /* rawlen is the full size of the current entry, rawlensize the
         * number of bytes a prevlen field needs to store it. */
        zipEntry(p, &cur);
        rawlen = cur.headersize + cur.len;
        rawlensize = zipPrevEncodeLength(NULL,rawlen);

        /* Abort if there is no next entry. */
        if (p[rawlen] == ZIP_END) break;
        zipEntry(p+rawlen, &next);

        /* Abort when "prevlen" has not changed. */
        if (next.prevrawlen == rawlen) break;

        if (next.prevrawlensize < rawlensize) {
            /* The "prevlen" field of "next" needs more bytes to hold
             * the raw length of "cur". The realloc may move the ziplist,
             * so "p" is rebuilt from its offset. */
            offset = p-zl;
            extra = rawlensize-next.prevrawlensize;
            zl = ziplistResize(zl,curlen+extra);
            p = zl+offset;

            /* Current pointer and offset for next element. */
            np = p+rawlen;
            noffset = np-zl;

            /* Update tail offset when next element is not the tail element. */
            if ((zl+intrev32ifbe(ZIPLIST_TAIL_OFFSET(zl))) != np) {
                ZIPLIST_TAIL_OFFSET(zl) =
                    intrev32ifbe(intrev32ifbe(ZIPLIST_TAIL_OFFSET(zl))+extra);
            }

            /* Move the tail to the back: everything after the old prevlen
             * field of "next", up to but not including the end marker. */
            memmove(np+rawlensize,
                np+next.prevrawlensize,
                curlen-noffset-next.prevrawlensize-1);
            zipPrevEncodeLength(np,rawlen);

            /* Advance the cursor */
            p += rawlen;
            curlen += extra;
        } else {
            if (next.prevrawlensize > rawlensize) {
                /* This would result in shrinking, which we want to avoid.
                 * So, set "rawlen" in the available bytes. */
                zipPrevEncodeLengthForceLarge(p+rawlen,rawlen);
            } else {
                zipPrevEncodeLength(p+rawlen,rawlen);
            }

            /* Stop here, as the raw length of "next" has not changed. */
            break;
        }
    }
    return zl;
}

/* Delete "num" entries, starting at "p". Returns pointer to the ziplist.
 *
 * Fewer than "num" entries are deleted when the end of the list is reached
 * first. The ziplist is reallocated, so the returned pointer replaces "zl"
 * and pointers into the old ziplist are no longer valid. */
static unsigned char *__ziplistDelete(unsigned char *zl, unsigned char *p, unsigned int num) {
    unsigned int i, totlen, deleted = 0;
    size_t offset;
    int nextdiff = 0;
    zlentry first, tail;

    /* Remember the first deleted entry, then walk "p" past the entries to
     * delete, stopping early at the end marker. */
    zipEntry(p, &first);
    for (i = 0; p[0] != ZIP_END && i < num; i++) {
        p += zipRawEntryLength(p);
        deleted++;
    }

    /* Number of bytes covered by the deleted entries. */
    totlen = p-first.p;
    if (totlen > 0) {
        if (p[0] != ZIP_END) {
            /* Storing `prevrawlen` in this entry may increase or decrease the
             * number of bytes required compare to the current `prevrawlen`.
             * There always is room to store this, because it was previously
             * stored by an entry that is now being deleted. */
            nextdiff = zipPrevLenByteDiff(p,first.prevrawlen);
            p -= nextdiff;
            zipPrevEncodeLength(p,first.prevrawlen);

            /* Update offset for tail */
            ZIPLIST_TAIL_OFFSET(zl) =
                intrev32ifbe(intrev32ifbe(ZIPLIST_TAIL_OFFSET(zl))-totlen);

            /* When the tail contains more than one entry, we need to take
             * "nextdiff" in account as well. Otherwise, a change in the
             * size of prevlen doesn't have an effect on the *tail* offset. */
            zipEntry(p, &tail);
            if (p[tail.headersize+tail.len] != ZIP_END) {
                ZIPLIST_TAIL_OFFSET(zl) =
                   intrev32ifbe(intrev32ifbe(ZIPLIST_TAIL_OFFSET(zl))+nextdiff);
            }

            /* Move tail to the front of the ziplist (the end marker is not
             * copied, ziplistResize() writes it again below). */
            memmove(first.p,p,
                intrev32ifbe(ZIPLIST_BYTES(zl))-(p-zl)-1);
        } else {
            /* The entire tail was deleted. No need to move memory. The new
             * tail is the entry preceding the first deleted one. */
            ZIPLIST_TAIL_OFFSET(zl) =
                intrev32ifbe((first.p-zl)-first.prevrawlen);
        }

        /* Resize and update length */
        offset = first.p-zl;
        zl = ziplistResize(zl, intrev32ifbe(ZIPLIST_BYTES(zl))-totlen+nextdiff);
        ZIPLIST_INCR_LENGTH(zl,-deleted);
        p = zl+offset;

        /* When nextdiff != 0, the raw length of the next entry has changed, so
         * we need to cascade the update throughout the ziplist */
        if (nextdiff != 0)
            zl = __ziplistCascadeUpdate(zl,p);
    }
    return zl;
}

/* Insert item at "p".
 *
 * "s"/"slen" is the value to store: it is saved as an integer when it can
 * be encoded as one, as a string otherwise. "p" is either an existing entry
 * (the new entry is placed before it) or the end marker (the new entry
 * becomes the tail).
 *
 * The ziplist is reallocated: the returned pointer replaces "zl" and any
 * pointer into the old ziplist is no longer valid. */
static unsigned char *__ziplistInsert(unsigned char *zl, unsigned char *p, unsigned char *s, unsigned int slen) {
    size_t curlen = intrev32ifbe(ZIPLIST_BYTES(zl)), reqlen;
    unsigned int prevlensize, prevlen = 0;
    size_t offset;
    int nextdiff = 0;
    int forcelarge = 0; /* Keep the 5-byte prevlen of the next entry. */
    unsigned char encoding = 0;
    long long value = 123456789; /* initialized to avoid warning. Using a value
                                    that is easy to see if for some reason
                                    we use it uninitialized. */
    zlentry tail;

    /* Find out prevlen for the entry that is inserted. */
    if (p[0] != ZIP_END) {
        ZIP_DECODE_PREVLEN(p, prevlensize, prevlen);
    } else {
        unsigned char *ptail = ZIPLIST_ENTRY_TAIL(zl);
        if (ptail[0] != ZIP_END) {
            prevlen = zipRawEntryLength(ptail);
        }
    }

    /* See if the entry can be encoded */
    if (zipTryEncoding(s,slen,&value,&encoding)) {
        /* 'encoding' is set to the appropriate integer encoding */
        reqlen = zipIntSize(encoding);
    } else {
        /* 'encoding' is untouched, however zipEncodeLength will use the
         * string length to figure out how to encode it. */
        reqlen = slen;
    }
    /* We need space for both the length of the previous entry and
     * the length of the payload. */
    reqlen += zipPrevEncodeLength(NULL,prevlen);
    reqlen += zipEncodeLength(NULL,encoding,slen);

    /* When the insert position is not equal to the tail, we need to
     * make sure that the next entry can hold this entry's length in
     * its prevlen field. */
    nextdiff = (p[0] != ZIP_END) ? zipPrevLenByteDiff(p,reqlen) : 0;

    /* The next entry may have a 5-byte prevlen field that the new entry
     * would allow to shrink to 1 byte (nextdiff == -4). When the new entry
     * is itself smaller than 4 bytes, the resulting ziplist would be
     * SMALLER than the current one: the realloc below would then cut off
     * live bytes (and the end marker would be written over them) before
     * the tail is moved. Avoid that by not shrinking the field at all, and
     * by storing the new length in its large form. */
    if (nextdiff == -4 && reqlen < 4) {
        nextdiff = 0;
        forcelarge = 1;
    }

    /* Store offset because a realloc may change the address of zl. */
    offset = p-zl;
    zl = ziplistResize(zl,curlen+reqlen+nextdiff);
    p = zl+offset;

    /* Apply memory move when necessary and update tail offset. */
    if (p[0] != ZIP_END) {
        /* Subtract one because of the ZIP_END bytes */
        memmove(p+reqlen,p-nextdiff,curlen-offset-1+nextdiff);

        /* Encode this entry's raw length in the next entry. */
        if (forcelarge)
            zipPrevEncodeLengthForceLarge(p+reqlen,reqlen);
        else
            zipPrevEncodeLength(p+reqlen,reqlen);

        /* Update offset for tail */
        ZIPLIST_TAIL_OFFSET(zl) =
            intrev32ifbe(intrev32ifbe(ZIPLIST_TAIL_OFFSET(zl))+reqlen);

        /* When the tail contains more than one entry, we need to take
         * "nextdiff" in account as well. Otherwise, a change in the
         * size of prevlen doesn't have an effect on the *tail* offset. */
        zipEntry(p+reqlen, &tail);
        if (p[reqlen+tail.headersize+tail.len] != ZIP_END) {
            ZIPLIST_TAIL_OFFSET(zl) =
                intrev32ifbe(intrev32ifbe(ZIPLIST_TAIL_OFFSET(zl))+nextdiff);
        }
    } else {
        /* This element will be the new tail. */
        ZIPLIST_TAIL_OFFSET(zl) = intrev32ifbe(p-zl);
    }

    /* When nextdiff != 0, the raw length of the next entry has changed, so
     * we need to cascade the update throughout the ziplist */
    if (nextdiff != 0) {
        offset = p-zl;
        zl = __ziplistCascadeUpdate(zl,p+reqlen);
        p = zl+offset;
    }

    /* Write the entry */
    p += zipPrevEncodeLength(p,prevlen);
    p += zipEncodeLength(p,encoding,slen);
    if (ZIP_IS_STR(encoding)) {
        memcpy(p,s,slen);
    } else {
        zipSaveInteger(p,value,encoding);
    }
    ZIPLIST_INCR_LENGTH(zl,1);
    return zl;
}

/* Merge ziplists 'first' and 'second' by appending 'second' to 'first'.
 *
 * NOTE: The ziplist whose header reports more entries is reallocated to hold
 * the merged result (on a tie 'first' is kept). The argument of the retained
 * ziplist is updated to the reallocated pointer; the other ziplist is free'd
 * and its argument is set to NULL.
 *
 * After calling this function, the input parameters are no longer valid since
 * they are changed and free'd in-place.
 *
 * The result ziplist is the contents of 'first' followed by 'second'.
 *
 * On failure: returns NULL if the merge is impossible (a NULL argument, or
 * both arguments naming the same ziplist). Nothing is modified in that case.
 * On success: returns the merged ziplist. */
unsigned char *ziplistMerge(unsigned char **first, unsigned char **second) {
    /* If any params are null, we can't merge, so NULL. */
    if (first == NULL || *first == NULL || second == NULL || *second == NULL)
        return NULL;

    /* Can't merge same list into itself. */
    if (*first == *second)
        return NULL;

    size_t first_bytes = intrev32ifbe(ZIPLIST_BYTES(*first));
    size_t first_len = intrev16ifbe(ZIPLIST_LENGTH(*first));

    size_t second_bytes = intrev32ifbe(ZIPLIST_BYTES(*second));
    size_t second_len = intrev16ifbe(ZIPLIST_LENGTH(*second));

    int append;
    unsigned char *source, *target;
    size_t target_bytes, source_bytes;
    /* Pick the ziplist with more entries so we can resize easily in-place.
     * We must also track if we are now appending or prepending to
     * the target ziplist. */
    if (first_len >= second_len) {
        /* retain first, append second to first. */
        target = *first;
        target_bytes = first_bytes;
        source = *second;
        source_bytes = second_bytes;
        append = 1;
    } else {
        /* else, retain second, prepend first to second. */
        target = *second;
        target_bytes = second_bytes;
        source = *first;
        source_bytes = first_bytes;
        append = 0;
    }

    /* Calculate final bytes (subtract one pair of metadata) */
    size_t zlbytes = first_bytes + second_bytes -
                     ZIPLIST_HEADER_SIZE - ZIPLIST_END_SIZE;
    size_t zllength = first_len + second_len;

    /* Combined zl length should be limited within UINT16_MAX */
    zllength = zllength < UINT16_MAX ? zllength : UINT16_MAX;

    /* Save offset positions before we start ripping memory apart. */
    size_t first_offset = intrev32ifbe(ZIPLIST_TAIL_OFFSET(*first));
    size_t second_offset = intrev32ifbe(ZIPLIST_TAIL_OFFSET(*second));

    /* Extend target to new zlbytes then append or prepend source. */
    target = drealloc(target, zlbytes);
    if (append) {
        /* append == appending to target */
        /* Copy source after target (copying over original [END]):
         *   [TARGET - END, SOURCE - HEADER] */
        memcpy(target + target_bytes - ZIPLIST_END_SIZE,
               source + ZIPLIST_HEADER_SIZE,
               source_bytes - ZIPLIST_HEADER_SIZE);
    } else {
        /* !append == prepending to target */
        /* Move target *contents* exactly size of (source - [END]),
         * then copy source into vacated space (source - [END]):
         *   [SOURCE - END, TARGET - HEADER] */
        memmove(target + source_bytes - ZIPLIST_END_SIZE,
                target + ZIPLIST_HEADER_SIZE,
                target_bytes - ZIPLIST_HEADER_SIZE);
        memcpy(target, source, source_bytes - ZIPLIST_END_SIZE);
    }

    /* Update header metadata. */
    ZIPLIST_BYTES(target) = intrev32ifbe(zlbytes);
    ZIPLIST_LENGTH(target) = intrev16ifbe(zllength);

    /* New tail offset.
     *
     * When 'second' holds no entries (only header + [END]) the last entry of
     * the merged list is still the tail of 'first', so its offset is kept.
     * Using the general formula here would make the tail offset point at the
     * [END] byte even though 'first' has entries.
     *
     * Otherwise the tail is the tail of 'second', shifted behind 'first':
     *   + N bytes of first ziplist
     *   - 1 byte for [END] of first ziplist
     *   + M bytes for the offset of the original tail of the second ziplist
     *   - J bytes for HEADER because second_offset keeps no header. */
    size_t tail_offset;
    if (second_bytes == ZIPLIST_HEADER_SIZE + ZIPLIST_END_SIZE) {
        tail_offset = first_offset;
    } else {
        tail_offset = (first_bytes - ZIPLIST_END_SIZE) +
                      (second_offset - ZIPLIST_HEADER_SIZE);
    }
    ZIPLIST_TAIL_OFFSET(target) = intrev32ifbe(tail_offset);

    /* __ziplistCascadeUpdate just fixes the prev length values until it finds a
     * correct prev length value (then it assumes the rest of the list is okay).
     * We tell CascadeUpdate to start at the first ziplist's tail element to fix
     * the merge seam. */
    target = __ziplistCascadeUpdate(target, target+first_offset);

    /* Now free and NULL out what we didn't realloc */
    if (append) {
        dfree(*second);
        *second = NULL;
        *first = target;
    } else {
        dfree(*first);
        *first = NULL;
        *second = target;
    }
    return target;
}

/* Insert the 'slen' bytes at 's' as a new entry of 'zl'. With
 * where == ZIPLIST_HEAD the entry is inserted at the head position, any other
 * value inserts at the position given by ZIPLIST_ENTRY_END. Returns the
 * ziplist pointer handed back by __ziplistInsert, which the caller must use
 * from now on. */
unsigned char *ziplistPush(unsigned char *zl, unsigned char *s, unsigned int slen, int where) {
    unsigned char *pos;

    if (where == ZIPLIST_HEAD) {
        pos = ZIPLIST_ENTRY_HEAD(zl);
    } else {
        pos = ZIPLIST_ENTRY_END(zl);
    }
    return __ziplistInsert(zl, pos, s, slen);
}

/* Returns an offset to use for iterating with ziplistNext. When the given
 * index is negative, the list is traversed back to front (-1 is the last
 * entry). When the list doesn't contain an element at the provided index,
 * NULL is returned. */
unsigned char *ziplistIndex(unsigned char *zl, int index) {
    unsigned char *p;
    unsigned int prevlensize, prevlen = 0;
    if (index < 0) {
        /* Number of backward steps from the tail. Written as -(index+1)
         * rather than (-index)-1 because negating INT_MIN overflows. */
        index = -(index + 1);
        p = ZIPLIST_ENTRY_TAIL(zl);
        if (p[0] != ZIP_END) {
            ZIP_DECODE_PREVLEN(p, prevlensize, prevlen);
            /* A prevlen of 0 marks the head entry: stop walking there. */
            while (prevlen > 0 && index--) {
                p -= prevlen;
                ZIP_DECODE_PREVLEN(p, prevlensize, prevlen);
            }
        }
    } else {
        p = ZIPLIST_ENTRY_HEAD(zl);
        while (p[0] != ZIP_END && index--) {
            p += zipRawEntryLength(p);
        }
    }
    /* index is still positive when the walk ran out of entries early. */
    return (p[0] == ZIP_END || index > 0) ? NULL : p;
}

/* Advance from the entry at 'p' to the entry that follows it.
 *
 * zl is the pointer to the ziplist (not used by this function)
 * p is the pointer to the current element
 *
 * Returns the element after 'p', or NULL when there is none. */
unsigned char *ziplistNext(unsigned char *zl, unsigned char *p) {
    unsigned char *next;

    (void) zl;

    /* 'p' may itself sit on ZIP_END (e.g. after ziplistDelete removed the
     * last entry): nothing can follow it. */
    if (p[0] == ZIP_END) return NULL;

    /* Step over the current entry; landing on ZIP_END means 'p' was the
     * last entry. */
    next = p + zipRawEntryLength(p);
    return (next[0] == ZIP_END) ? NULL : next;
}

/* Return pointer to the entry preceding 'p' in ziplist 'zl', or NULL when
 * there is no such entry. */
unsigned char *ziplistPrev(unsigned char *zl, unsigned char *p) {
    unsigned int prevlensize, prevlen = 0;

    /* Stepping back from ZIP_END yields the tail entry, unless the list is
     * empty and the tail position is ZIP_END as well. */
    if (p[0] == ZIP_END) {
        unsigned char *tail = ZIPLIST_ENTRY_TAIL(zl);
        if (tail[0] == ZIP_END) return NULL;
        return tail;
    }

    /* Already at the head: nothing comes before it. */
    if (p == ZIPLIST_ENTRY_HEAD(zl)) return NULL;

    /* Every non-head entry records the raw length of its predecessor. */
    ZIP_DECODE_PREVLEN(p, prevlensize, prevlen);
    ASSERT(prevlen > 0);
    return p - prevlen;
}

/* Get entry pointed to by 'p' and store it in either '*sstr' (with its
 * length in '*slen') or '*sval', depending on the encoding of the entry.
 *
 * Returns 0 if 'p' is NULL or points to the end of the ziplist; no output
 * argument is touched in that case. Otherwise returns 1, and '*sstr' is
 * first reset to NULL so the caller can tell whether the string pointer or
 * the integer value was set.
 *
 * Any of 'sstr', 'slen' and 'sval' may be NULL. A string entry is reported
 * only when 'sstr' is non-NULL, an integer entry only when 'sval' is. */
unsigned int ziplistGet(unsigned char *p, unsigned char **sstr, unsigned int *slen, long long *sval) {
    zlentry entry;
    if (p == NULL || p[0] == ZIP_END) return 0;
    if (sstr) *sstr = NULL;

    zipEntry(p, &entry);
    if (ZIP_IS_STR(entry.encoding)) {
        if (sstr) {
            /* 'slen' is optional too: do not write through a NULL pointer. */
            if (slen) *slen = entry.len;
            *sstr = p+entry.headersize;
        }
    } else {
        if (sval) {
            *sval = zipLoadInteger(p+entry.headersize,entry.encoding);
        }
    }
    return 1;
}

/* Insert the 'slen' bytes at 's' as a new entry at position 'p' of 'zl'.
 * Public wrapper around __ziplistInsert; returns the ziplist pointer that
 * call hands back. */
unsigned char *ziplistInsert(unsigned char *zl, unsigned char *p, unsigned char *s, unsigned int slen) {
    unsigned char *updated = __ziplistInsert(zl, p, s, slen);

    return updated;
}

/* Delete the single entry pointed to by '*p' from the ziplist.
 *
 * '*p' is rewritten to the same byte offset inside the returned ziplist, so
 * callers can keep iterating while deleting. After the last entry has been
 * deleted '*p' may end up pointing at ZIP_END, which callers must check. */
unsigned char *ziplistDelete(unsigned char *zl, unsigned char **p) {
    /* Remember the position as an offset: the pointer handed back by
     * __ziplistDelete may differ from 'zl'. */
    size_t pos = *p - zl;
    unsigned char *resized = __ziplistDelete(zl, *p, 1);

    *p = resized + pos;
    return resized;
}

/* Delete up to 'num' entries starting at position 'index' (negative values
 * are interpreted as by ziplistIndex). When 'index' does not name an entry
 * the ziplist is returned untouched. */
unsigned char *ziplistDeleteRange(unsigned char *zl, int index, unsigned int num) {
    unsigned char *start = ziplistIndex(zl, index);

    if (start == NULL) {
        return zl;
    }
    return __ziplistDelete(zl, start, num);
}

/* Compare the entry pointed to by 'p' with 'sstr' of length 'slen'.
 * Returns 1 if they are equal, 0 otherwise (including when 'p' points to the
 * end of the ziplist). */
unsigned int ziplistCompare(unsigned char *p, unsigned char *sstr, unsigned int slen) {
    zlentry ent;
    unsigned char wanted_enc;
    long long stored, wanted;

    if (p[0] == ZIP_END) return 0;

    zipEntry(p, &ent);

    if (ZIP_IS_STR(ent.encoding)) {
        /* String entry: equal lengths and identical bytes. */
        if (ent.len != slen) return 0;
        return memcmp(p + ent.headersize, sstr, slen) == 0;
    }

    /* Integer entry: compare the decoded values rather than the encodings,
     * since different implementations may encode integers differently. */
    if (!zipTryEncoding(sstr, slen, &wanted, &wanted_enc)) return 0;

    stored = zipLoadInteger(p + ent.headersize, ent.encoding);
    return stored == wanted;
}

/* Starting at 'p', look for an entry equal to the 'vlen' bytes at 'vstr'.
 * After each comparison, 'skip' entries are passed over before the next one
 * is compared. Returns a pointer to the matching entry, or NULL when the end
 * of the ziplist is reached without a match. */
unsigned char *ziplistFind(unsigned char *p, unsigned char *vstr, unsigned int vlen, unsigned int skip) {
    int pending = 0;              /* entries left to pass over */
    unsigned char needle_enc = 0; /* 0: not tried, UCHAR_MAX: not an integer */
    long long needle_val = 0;

    while (p[0] != ZIP_END) {
        unsigned int prevlensize, encoding, lensize, len;
        unsigned char *payload;

        /* Decode just enough of the header to locate payload and length. */
        ZIP_DECODE_PREVLENSIZE(p, prevlensize);
        ZIP_DECODE_LENGTH(p + prevlensize, encoding, lensize, len);
        payload = p + prevlensize + lensize;

        if (pending != 0) {
            /* This entry is one of the skipped ones. */
            pending--;
        } else {
            if (ZIP_IS_STR(encoding)) {
                if (len == vlen && memcmp(payload, vstr, vlen) == 0) {
                    return p;
                }
            } else {
                /* Try to turn the searched value into an integer only once:
                 * afterwards needle_enc is non-zero, and UCHAR_MAX records
                 * that no integer encoding exists for it. */
                if (needle_enc == 0) {
                    if (!zipTryEncoding(vstr, vlen, &needle_val, &needle_enc)) {
                        needle_enc = UCHAR_MAX;
                    }
                    /* Must be non-zero by now */
                    ASSERT(needle_enc);
                }

                /* A value without integer encoding can never equal an
                 * integer entry, so only compare when one was found. */
                if (needle_enc != UCHAR_MAX &&
                    zipLoadInteger(payload, encoding) == needle_val) {
                    return p;
                }
            }

            /* Restart the skip countdown after every comparison. */
            pending = skip;
        }

        /* Step to the following entry. */
        p = payload + len;
    }

    return NULL;
}

/* Return the number of entries in the ziplist.
 *
 * The header counter is trusted while it is below UINT16_MAX. Otherwise the
 * entries are counted by walking the list, and the header is refreshed when
 * the real count turns out to fit again. */
unsigned int ziplistLen(unsigned char *zl) {
    unsigned int count = intrev16ifbe(ZIPLIST_LENGTH(zl));
    unsigned char *cur;

    if (count < UINT16_MAX) {
        return count;
    }

    /* Counter saturated: count the entries one by one. */
    count = 0;
    for (cur = zl + ZIPLIST_HEADER_SIZE; *cur != ZIP_END;
         cur += zipRawEntryLength(cur)) {
        count++;
    }

    /* Re-store length if small enough */
    if (count < UINT16_MAX) {
        ZIPLIST_LENGTH(zl) = intrev16ifbe(count);
    }
    return count;
}

/* Return the size in bytes of the whole ziplist blob, as recorded in the
 * header field read through ZIPLIST_BYTES. */
size_t ziplistBlobLen(unsigned char *zl) {
    size_t total = intrev32ifbe(ZIPLIST_BYTES(zl));

    return total;
}

/* Print a human-readable dump of the ziplist 'zl' to stdout: first the three
 * header fields, then one line per entry with its address, index, offset,
 * sizes and payload (strings longer than 40 bytes are cut and followed by
 * "..."), and finally an "{end}" marker. fwrite failures are reported
 * through perror. */
void ziplistRepr(unsigned char *zl) {
    unsigned char *p;
    int index = 0;
    zlentry entry;

    /* The header fields are unsigned; cast so every argument matches its
     * %u conversion exactly. */
    printf(
        "{total bytes %u} "
        "{length %u}\n"
        "{tail offset %u}\n",
        (unsigned int) intrev32ifbe(ZIPLIST_BYTES(zl)),
        (unsigned int) intrev16ifbe(ZIPLIST_LENGTH(zl)),
        (unsigned int) intrev32ifbe(ZIPLIST_TAIL_OFFSET(zl)));
    p = ZIPLIST_ENTRY_HEAD(zl);
    while(*p != ZIP_END) {
        zipEntry(p, &entry);
        printf(
            "{"
                "addr 0x%08lx, "
                "index %2d, "
                "offset %5lu, "
                "rl: %5u, "
                "hs %2u, "
                "pl: %5u, "
                "pls: %2u, "
                "payload %5u"
            "} ",
            (long unsigned)p,
            index,
            (unsigned long) (p-zl),
            entry.headersize+entry.len,
            entry.headersize,
            entry.prevrawlen,
            entry.prevrawlensize,
            entry.len);
        /* Skip the entry header so 'p' points at the payload. */
        p += entry.headersize;
        if (ZIP_IS_STR(entry.encoding)) {
            if (entry.len > 40) {
                if (fwrite(p,40,1,stdout) == 0) perror("fwrite");
                printf("...");
            } else {
                if (entry.len &&
                    fwrite(p,entry.len,1,stdout) == 0) perror("fwrite");
            }
        } else {
            printf("%lld", (long long) zipLoadInteger(p,entry.encoding));
        }
        printf("\n");
        /* Skip the payload to reach the next entry. */
        p += entry.len;
        index++;
    }
    printf("{end}\n\n");
}

#ifdef REDIS_TEST
#include <sys/time.h>
#include "adlist.h"
#include "sds.h"

/* Print a printf-style message only when DEBUG evaluates to true. DEBUG is
 * not defined in the visible part of this file -- TODO confirm where it comes
 * from. At least one argument must follow the format string, because
 * __VA_ARGS__ is expanded after a mandatory comma. */
#define debug(f, ...) { if (DEBUG) printf(f, __VA_ARGS__); }

/* Build the small fixture list used by the tests. Three values are pushed to
 * the tail and "hello" to the head, giving [hello, foo, quux, 1024]. The
 * caller owns the returned ziplist. */
static unsigned char *createList() {
    static const struct {
        const char *text;
        unsigned int len;
        int where;
    } items[] = {
        { "foo",   3, ZIPLIST_TAIL },
        { "quux",  4, ZIPLIST_TAIL },
        { "hello", 5, ZIPLIST_HEAD },
        { "1024",  4, ZIPLIST_TAIL },
    };
    unsigned char *zl = ziplistNew();
    size_t i;

    for (i = 0; i < sizeof(items)/sizeof(items[0]); i++) {
        zl = ziplistPush(zl, (unsigned char*)items[i].text,
                         items[i].len, items[i].where);
    }
    return zl;
}

/* Build a fixture list mixing decimal integer strings of different
 * magnitudes with two non-integer strings. The values are pushed in the order
 * listed below, each at the end given next to it. The caller owns the
 * returned ziplist. */
static unsigned char *createIntList() {
    static const struct {
        const char *text;
        int where;
    } items[] = {
        { "100",                          ZIPLIST_TAIL },
        { "128000",                       ZIPLIST_TAIL },
        { "-100",                         ZIPLIST_HEAD },
        { "4294967296",                   ZIPLIST_HEAD },
        { "non integer",                  ZIPLIST_TAIL },
        { "much much longer non integer", ZIPLIST_TAIL },
    };
    unsigned char *zl = ziplistNew();
    size_t i;

    for (i = 0; i < sizeof(items)/sizeof(items[0]); i++) {
        zl = ziplistPush(zl, (unsigned char*)items[i].text,
                         strlen(items[i].text), items[i].where);
    }
    return zl;
}

/* Return the current time reported by gettimeofday() as a single count of
 * microseconds (seconds * 1000000 + microseconds). */
static long long usec(void) {
    struct timeval now;
    long long micros;

    gettimeofday(&now,NULL);
    micros = (long long) now.tv_sec;
    micros *= 1000000;
    micros += now.tv_usec;
    return micros;
}

/* Timing loop: for list sizes 0, dnum, 2*dnum, ... below 'maxsize', build a
 * list of that many "quux" entries, then run 'num' rounds of "push at 'pos',
 * delete the entry at index 0" and print how long the rounds took.
 * 'pos' also indexes the two-element label table, so it has to be
 * ZIPLIST_HEAD or ZIPLIST_TAIL. */
static void stress(int pos, int num, int maxsize, int dnum) {
    char posstr[2][5] = { "HEAD", "TAIL" };
    int size;

    for (size = 0; size < maxsize; size += dnum) {
        unsigned char *zl = ziplistNew();
        long long began;
        int n;

        /* Pre-fill the list to the size under test. */
        for (n = 0; n < size; n++) {
            zl = ziplistPush(zl,(unsigned char*)"quux",4,ZIPLIST_TAIL);
        }

        /* Do num times a push+pop from pos */
        began = usec();
        for (n = 0; n < num; n++) {
            zl = ziplistPush(zl,(unsigned char*)"quux",4,pos);
            zl = ziplistDeleteRange(zl,0,1);
        }
        printf("List size: %8d, bytes: %8d, %dx push+pop (%s): %6lld usec\n",
            size,intrev32ifbe(ZIPLIST_BYTES(zl)),num,posstr[pos],usec()-began);
        dfree(zl);
    }
}

/* Print and remove the head entry (where == ZIPLIST_HEAD) or otherwise the
 * tail entry of 'zl'. Returns the ziplist pointer to use afterwards. When no
 * entry can be fetched an error is printed and the process exits with
 * status 1. */
static unsigned char *pop(unsigned char *zl, int where) {
    unsigned char *victim, *str;
    unsigned int len;
    long long num;

    victim = ziplistIndex(zl, (where == ZIPLIST_HEAD) ? 0 : -1);
    if (!ziplistGet(victim,&str,&len,&num)) {
        printf("ERROR: Could not pop\n");
        exit(1);
    }

    if (where == ZIPLIST_HEAD) {
        printf("Pop head: ");
    } else {
        printf("Pop tail: ");
    }

    /* ziplistGet leaves the string pointer NULL for integer entries. */
    if (str == NULL) {
        printf("%lld", num);
    } else if (len && fwrite(str,len,1,stdout) == 0) {
        perror("fwrite");
    }

    printf("\n");
    return ziplistDelete(zl,&victim);
}

/* Fill 'target' with a random number of random bytes and return that number.
 * The length is drawn from [min, max]; the bytes come from one of three
 * randomly chosen ranges: 0-255, 48-122 or 48-52. No terminating NUL is
 * written. */
static int randstring(char *target, unsigned int min, unsigned int max) {
    int len = min+rand()%(max-min+1);
    int kind = rand() % 3;
    int lo, hi;
    int i;

    if (kind == 0) {
        lo = 0;
        hi = 255;
    } else if (kind == 1) {
        lo = 48;
        hi = 122;
    } else if (kind == 2) {
        lo = 48;
        hi = 52;
    } else {
        ASSERT(NULL);
    }

    for (i = 0; i < len; i++) {
        target[i] = lo+rand()%(hi-lo+1);
    }
    return len;
}

/* Decode every entry of 'zl' into e[0..len-1] and check that looking the
 * same entry up through a negative index decodes to an identical zlentry.
 * 'e' must have room for at least ziplistLen(zl) elements. */
static void verify(unsigned char *zl, zlentry *e) {
    int total = ziplistLen(zl);
    zlentry back;

    ZIPLIST_ENTRY_ZERO(&back);

    for (int idx = 0; idx < total; idx++) {
        zlentry *fwd = &e[idx];

        /* Entry reached by counting from the head. */
        memset(fwd, 0, sizeof(zlentry));
        zipEntry(ziplistIndex(zl, idx), fwd);

        /* The same entry reached by counting from the tail. */
        memset(&back, 0, sizeof(zlentry));
        zipEntry(ziplistIndex(zl, -total+idx), &back);

        ASSERT(memcmp(fwd, &back, sizeof(zlentry)) == 0);
    }
}

/* Self-test for the ziplist implementation (built only with REDIS_TEST).
 *
 * Runs a fixed sequence of scenarios, printing progress to stdout: pops,
 * positive and negative indexing, forward and backward iteration, deletion,
 * regression cases, comparison, merging, and two stress runs.
 *
 * argc/argv: when exactly one extra argument is given it is parsed with
 * atoi() and used as the seed for rand().
 *
 * Returns 0 when the end is reached, 1 when one of the explicitly checked
 * scenarios fails (those early returns do not free the list in use). Other
 * checks go through ASSERT. */
int ziplistTest(int argc, char **argv) {
    int ret;
    unsigned char *zl, *p;
    unsigned char *entry;
    unsigned int elen;
    long long value;

    /* If an argument is given, use it as the random seed. */
    if (argc == 2)
        srand(atoi(argv[1]));

    zl = createIntList();
    ziplistRepr(zl);

    dfree(zl);

    /* Pop all four fixture entries, dumping the list after each pop. */
    zl = createList();
    ziplistRepr(zl);

    zl = pop(zl,ZIPLIST_TAIL);
    ziplistRepr(zl);

    zl = pop(zl,ZIPLIST_HEAD);
    ziplistRepr(zl);

    zl = pop(zl,ZIPLIST_TAIL);
    ziplistRepr(zl);

    zl = pop(zl,ZIPLIST_TAIL);
    ziplistRepr(zl);

    dfree(zl);

    printf("Get element at index 3:\n");
    {
        zl = createList();
        p = ziplistIndex(zl, 3);
        if (!ziplistGet(p, &entry, &elen, &value)) {
            printf("ERROR: Could not access index 3\n");
            return 1;
        }
        if (entry) {
            if (elen && fwrite(entry,elen,1,stdout) == 0) perror("fwrite");
            printf("\n");
        } else {
            printf("%lld\n", value);
        }
        printf("\n");
        dfree(zl);
    }

    printf("Get element at index 4 (out of range):\n");
    {
        zl = createList();
        p = ziplistIndex(zl, 4);
        if (p == NULL) {
            printf("No entry\n");
        } else {
            printf("ERROR: Out of range index should return NULL, returned offset: %ld\n", p-zl);
            return 1;
        }
        printf("\n");
        dfree(zl);
    }

    printf("Get element at index -1 (last element):\n");
    {
        zl = createList();
        p = ziplistIndex(zl, -1);
        if (!ziplistGet(p, &entry, &elen, &value)) {
            printf("ERROR: Could not access index -1\n");
            return 1;
        }
        if (entry) {
            if (elen && fwrite(entry,elen,1,stdout) == 0) perror("fwrite");
            printf("\n");
        } else {
            printf("%lld\n", value);
        }
        printf("\n");
        dfree(zl);
    }

    printf("Get element at index -4 (first element):\n");
    {
        zl = createList();
        p = ziplistIndex(zl, -4);
        if (!ziplistGet(p, &entry, &elen, &value)) {
            printf("ERROR: Could not access index -4\n");
            return 1;
        }
        if (entry) {
            if (elen && fwrite(entry,elen,1,stdout) == 0) perror("fwrite");
            printf("\n");
        } else {
            printf("%lld\n", value);
        }
        printf("\n");
        dfree(zl);
    }

    printf("Get element at index -5 (reverse out of range):\n");
    {
        zl = createList();
        p = ziplistIndex(zl, -5);
        if (p == NULL) {
            printf("No entry\n");
        } else {
            printf("ERROR: Out of range index should return NULL, returned offset: %ld\n", p-zl);
            return 1;
        }
        printf("\n");
        dfree(zl);
    }

    printf("Iterate list from 0 to end:\n");
    {
        zl = createList();
        p = ziplistIndex(zl, 0);
        /* ziplistGet returns 0 once ziplistNext has handed back NULL. */
        while (ziplistGet(p, &entry, &elen, &value)) {
            printf("Entry: ");
            if (entry) {
                if (elen && fwrite(entry,elen,1,stdout) == 0) perror("fwrite");
            } else {
                printf("%lld", value);
            }
            p = ziplistNext(zl,p);
            printf("\n");
        }
        printf("\n");
        dfree(zl);
    }

    printf("Iterate list from 1 to end:\n");
    {
        zl = createList();
        p = ziplistIndex(zl, 1);
        while (ziplistGet(p, &entry, &elen, &value)) {
            printf("Entry: ");
            if (entry) {
                if (elen && fwrite(entry,elen,1,stdout) == 0) perror("fwrite");
            } else {
                printf("%lld", value);
            }
            p = ziplistNext(zl,p);
            printf("\n");
        }
        printf("\n");
        dfree(zl);
    }

    printf("Iterate list from 2 to end:\n");
    {
        zl = createList();
        p = ziplistIndex(zl, 2);
        while (ziplistGet(p, &entry, &elen, &value)) {
            printf("Entry: ");
            if (entry) {
                if (elen && fwrite(entry,elen,1,stdout) == 0) perror("fwrite");
            } else {
                printf("%lld", value);
            }
            p = ziplistNext(zl,p);
            printf("\n");
        }
        printf("\n");
        dfree(zl);
    }

    printf("Iterate starting out of range:\n");
    {
        zl = createList();
        p = ziplistIndex(zl, 4);
        if (!ziplistGet(p, &entry, &elen, &value)) {
            printf("No entry\n");
        } else {
            printf("ERROR\n");
        }
        printf("\n");
        dfree(zl);
    }

    printf("Iterate from back to front:\n");
    {
        zl = createList();
        p = ziplistIndex(zl, -1);
        while (ziplistGet(p, &entry, &elen, &value)) {
            printf("Entry: ");
            if (entry) {
                if (elen && fwrite(entry,elen,1,stdout) == 0) perror("fwrite");
            } else {
                printf("%lld", value);
            }
            p = ziplistPrev(zl,p);
            printf("\n");
        }
        printf("\n");
        dfree(zl);
    }

    printf("Iterate from back to front, deleting all items:\n");
    {
        zl = createList();
        p = ziplistIndex(zl, -1);
        while (ziplistGet(p, &entry, &elen, &value)) {
            printf("Entry: ");
            if (entry) {
                if (elen && fwrite(entry,elen,1,stdout) == 0) perror("fwrite");
            } else {
                printf("%lld", value);
            }
            /* ziplistDelete re-points p into the returned list; stepping
             * back from there reaches the entry before the deleted one. */
            zl = ziplistDelete(zl,&p);
            p = ziplistPrev(zl,p);
            printf("\n");
        }
        printf("\n");
        dfree(zl);
    }

    printf("Delete inclusive range 0,0:\n");
    {
        zl = createList();
        zl = ziplistDeleteRange(zl, 0, 1);
        ziplistRepr(zl);
        dfree(zl);
    }

    printf("Delete inclusive range 0,1:\n");
    {
        zl = createList();
        zl = ziplistDeleteRange(zl, 0, 2);
        ziplistRepr(zl);
        dfree(zl);
    }

    printf("Delete inclusive range 1,2:\n");
    {
        zl = createList();
        zl = ziplistDeleteRange(zl, 1, 2);
        ziplistRepr(zl);
        dfree(zl);
    }

    printf("Delete with start index out of range:\n");
    {
        zl = createList();
        zl = ziplistDeleteRange(zl, 5, 1);
        ziplistRepr(zl);
        dfree(zl);
    }

    printf("Delete with num overflow:\n");
    {
        zl = createList();
        zl = ziplistDeleteRange(zl, 1, 5);
        ziplistRepr(zl);
        dfree(zl);
    }

    printf("Delete foo while iterating:\n");
    {
        zl = createList();
        p = ziplistIndex(zl,0);
        while (ziplistGet(p,&entry,&elen,&value)) {
            if (entry && strncmp("foo",(char*)entry,elen) == 0) {
                printf("Delete foo\n");
                /* No ziplistNext here: after the delete p already refers
                 * to whatever follows the removed entry. */
                zl = ziplistDelete(zl,&p);
            } else {
                printf("Entry: ");
                if (entry) {
                    if (elen && fwrite(entry,elen,1,stdout) == 0)
                        perror("fwrite");
                } else {
                    printf("%lld",value);
                }
                p = ziplistNext(zl,p);
                printf("\n");
            }
        }
        printf("\n");
        ziplistRepr(zl);
        dfree(zl);
    }

    printf("Regression test for >255 byte strings:\n");
    {
        /* 256 payload bytes plus the terminating NUL left by the zero
         * initializer, so strlen() below yields 256. */
        char v1[257] = {0}, v2[257] = {0};
        memset(v1,'x',256);
        memset(v2,'y',256);
        zl = ziplistNew();
        zl = ziplistPush(zl,(unsigned char*)v1,strlen(v1),ZIPLIST_TAIL);
        zl = ziplistPush(zl,(unsigned char*)v2,strlen(v2),ZIPLIST_TAIL);

        /* Pop values again and compare their value. */
        p = ziplistIndex(zl,0);
        ret = (int)ziplistGet(p,&entry,&elen,&value);
        ASSERT(ret > 0);
        ASSERT(strncmp(v1,(char*)entry,elen) == 0);
        p = ziplistIndex(zl,1);
        ret = (int)ziplistGet(p,&entry,&elen,&value);
        ASSERT(ret > 0);
        ASSERT(strncmp(v2,(char*)entry,elen) == 0);
        printf("SUCCESS\n\n");
        dfree(zl);
    }

    printf("Regression test deleting next to last entries:\n");
    {
        char v[3][257] = {{0}};
        zlentry e[3] = {{.prevrawlensize = 0, .prevrawlen = 0, .lensize = 0,
                         .len = 0, .headersize = 0, .encoding = 0, .p = NULL}};
        size_t i;

        for (i = 0; i < (sizeof(v)/sizeof(v[0])); i++) {
            memset(v[i], 'a' + i, sizeof(v[0]));
        }

        /* Terminate the strings: v[0] and v[2] are 256 bytes long, v[1] is
         * a single byte. */
        v[0][256] = '\0';
        v[1][  1] = '\0';
        v[2][256] = '\0';

        zl = ziplistNew();
        for (i = 0; i < (sizeof(v)/sizeof(v[0])); i++) {
            zl = ziplistPush(zl, (unsigned char *) v[i], strlen(v[i]), ZIPLIST_TAIL);
        }

        verify(zl, e);

        ASSERT(e[0].prevrawlensize == 1);
        ASSERT(e[1].prevrawlensize == 5);
        ASSERT(e[2].prevrawlensize == 1);

        /* Deleting entry 1 will increase `prevrawlensize` for entry 2 */
        /* NOTE: this local 'p' shadows the function-level 'p'. */
        unsigned char *p = e[1].p;
        zl = ziplistDelete(zl, &p);

        verify(zl, e);

        ASSERT(e[0].prevrawlensize == 1);
        ASSERT(e[1].prevrawlensize == 5);

        printf("SUCCESS\n\n");
        dfree(zl);
    }

    printf("Create long list and check indices:\n");
    {
        zl = ziplistNew();
        char buf[32];
        int i,len;
        for (i = 0; i < 1000; i++) {
            len = sprintf(buf,"%d",i);
            zl = ziplistPush(zl,(unsigned char*)buf,len,ZIPLIST_TAIL);
        }
        for (i = 0; i < 1000; i++) {
            /* Entry i counted from the head must hold i ... */
            p = ziplistIndex(zl,i);
            ret = (int)ziplistGet(p,NULL,NULL,&value);
            ASSERT(ret > 0);
            ASSERT(i == value);

            /* ... and entry i counted from the tail must hold 999-i. */
            p = ziplistIndex(zl,-i-1);
            ret = (int)ziplistGet(p,NULL,NULL,&value);
            ASSERT(ret > 0);
            ASSERT(999-i == value);
        }
        printf("SUCCESS\n\n");
        dfree(zl);
    }

    printf("Compare strings with ziplist entries:\n");
    {
        zl = createList();
        p = ziplistIndex(zl,0);
        if (!ziplistCompare(p,(unsigned char*)"hello",5)) {
            printf("ERROR: not \"hello\"\n");
            return 1;
        }
        if (ziplistCompare(p,(unsigned char*)"hella",5)) {
            printf("ERROR: \"hella\"\n");
            return 1;
        }

        p = ziplistIndex(zl,3);
        if (!ziplistCompare(p,(unsigned char*)"1024",4)) {
            printf("ERROR: not \"1024\"\n");
            return 1;
        }
        if (ziplistCompare(p,(unsigned char*)"1025",4)) {
            printf("ERROR: \"1025\"\n");
            return 1;
        }
        printf("SUCCESS\n\n");
        dfree(zl);
    }

    printf("Merge test:\n");
    {
        /* create list gives us: [hello, foo, quux, 1024] */
        zl = createList();
        unsigned char *zl2 = createList();

        unsigned char *zl3 = ziplistNew();
        unsigned char *zl4 = ziplistNew();

        if (ziplistMerge(&zl4, &zl4)) {
            printf("ERROR: Allowed merging of one ziplist into itself.\n");
            return 1;
        }

        /* Merge two empty ziplists, get empty result back. */
        /* ziplistMerge frees one input and returns the other, so a single
         * dfree of the result releases everything. */
        zl4 = ziplistMerge(&zl3, &zl4);
        ziplistRepr(zl4);
        if (ziplistLen(zl4)) {
            printf("ERROR: Merging two empty ziplists created entries.\n");
            return 1;
        }
        dfree(zl4);

        zl2 = ziplistMerge(&zl, &zl2);
        /* merge gives us: [hello, foo, quux, 1024, hello, foo, quux, 1024] */
        ziplistRepr(zl2);

        if (ziplistLen(zl2) != 8) {
            printf("ERROR: Merged length not 8, but: %u\n", ziplistLen(zl2));
            return 1;
        }

        p = ziplistIndex(zl2,0);
        if (!ziplistCompare(p,(unsigned char*)"hello",5)) {
            printf("ERROR: not \"hello\"\n");
            return 1;
        }
        if (ziplistCompare(p,(unsigned char*)"hella",5)) {
            printf("ERROR: \"hella\"\n");
            return 1;
        }

        p = ziplistIndex(zl2,3);
        if (!ziplistCompare(p,(unsigned char*)"1024",4)) {
            printf("ERROR: not \"1024\"\n");
            return 1;
        }
        if (ziplistCompare(p,(unsigned char*)"1025",4)) {
            printf("ERROR: \"1025\"\n");
            return 1;
        }

        p = ziplistIndex(zl2,4);
        if (!ziplistCompare(p,(unsigned char*)"hello",5)) {
            printf("ERROR: not \"hello\"\n");
            return 1;
        }
        if (ziplistCompare(p,(unsigned char*)"hella",5)) {
            printf("ERROR: \"hella\"\n");
            return 1;
        }

        p = ziplistIndex(zl2,7);
        if (!ziplistCompare(p,(unsigned char*)"1024",4)) {
            printf("ERROR: not \"1024\"\n");
            return 1;
        }
        if (ziplistCompare(p,(unsigned char*)"1025",4)) {
            printf("ERROR: \"1025\"\n");
            return 1;
        }
        printf("SUCCESS\n\n");
        /* Both lists report 4 entries, so ziplistMerge kept 'first': zl and
         * zl2 now name the same merged buffer and it is freed once. */
        dfree(zl);
    }

    printf("Stress with random payloads of different encoding:\n");
    {
        int i,j,len,where;
        unsigned char *p;
        char buf[1024];
        int buflen;
        dlist *ref;
        dlistNode *refnode;

        /* Hold temp vars from ziplist */
        unsigned char *sstr;
        unsigned int slen;
        long long sval;

        for (i = 0; i < 20000; i++) {
            /* 'ref' mirrors every push in a plain list of sds strings and
             * is compared against the ziplist afterwards. */
            zl = ziplistNew();
            ref = dlistCreate();
            dlistSetFreeMethod(ref,(void (*)(void*))sdsfree);
            len = rand() % 256;

            /* Create lists */
            for (j = 0; j < len; j++) {
                where = (rand() & 1) ? ZIPLIST_HEAD : ZIPLIST_TAIL;
                if (rand() % 2) {
                    buflen = randstring(buf,1,sizeof(buf)-1);
                } else {
                    /* Decimal numbers of three different magnitudes. */
                    switch(rand() % 3) {
                    case 0:
                        buflen = sprintf(buf,"%lld",(0LL + rand()) >> 20);
                        break;
                    case 1:
                        buflen = sprintf(buf,"%lld",(0LL + rand()));
                        break;
                    case 2:
                        buflen = sprintf(buf,"%lld",(0LL + rand()) << 20);
                        break;
                    default:
                        ASSERT(NULL);
                    }
                }

                /* Add to ziplist */
                zl = ziplistPush(zl, (unsigned char*)buf, buflen, where);

                /* Add to reference list */
                if (where == ZIPLIST_HEAD) {
                    dlistAddNodeHead(ref,sdsnewlen(buf, buflen));
                } else if (where == ZIPLIST_TAIL) {
                    dlistAddNodeTail(ref,sdsnewlen(buf, buflen));
                } else {
                    ASSERT(NULL);
                }
            }

            ASSERT(dlistLength(ref) == ziplistLen(zl));
            for (j = 0; j < len; j++) {
                /* Naive way to get elements, but similar to the stresser
                 * executed from the Tcl test suite. */
                p = ziplistIndex(zl,j);
                refnode = dlistIndex(ref,j);

                ret = (int)ziplistGet(p,&sstr,&slen,&sval);
                ASSERT(ret > 0);
                /* Integer entries are rendered back to decimal text before
                 * the comparison with the reference string. */
                if (sstr == NULL) {
                    buflen = sprintf(buf,"%lld",sval);
                } else {
                    buflen = slen;
                    memcpy(buf,sstr,buflen);
                    buf[buflen] = '\0';
                }
                ASSERT(memcmp(buf,dlistNodeValue(refnode),buflen) == 0);
            }
            dfree(zl);
            dlistRelease(ref);
        }
        printf("SUCCESS\n\n");
    }

    printf("Stress with variable ziplist size:\n");
    {
        stress(ZIPLIST_HEAD,100000,16384,256);
        stress(ZIPLIST_TAIL,100000,16384,256);
    }

    return 0;
}
#endif


================================================
FILE: src/vr_ziplist.h
================================================
#ifndef _ZIPLIST_H
#define _ZIPLIST_H

/* size_t is used by ziplistBlobLen(); include it here so this header can be
 * included on its own, regardless of include order. */
#include <stddef.h>

/* Values accepted by the 'where' argument of ziplistPush(). */
#define ZIPLIST_HEAD 0
#define ZIPLIST_TAIL 1

/* All functions that return 'unsigned char *' and take the ziplist 'zl'
 * return the ziplist pointer to use from then on: callers in this project
 * always reassign it (e.g. zl = ziplistPush(zl, ...)). */
unsigned char *ziplistNew(void);
unsigned char *ziplistMerge(unsigned char **first, unsigned char **second);
unsigned char *ziplistPush(unsigned char *zl, unsigned char *s, unsigned int slen, int where);
unsigned char *ziplistIndex(unsigned char *zl, int index);
unsigned char *ziplistNext(unsigned char *zl, unsigned char *p);
unsigned char *ziplistPrev(unsigned char *zl, unsigned char *p);
/* Reads the entry at 'p'. Callers treat a NULL *sval as "the entry is an
 * integer stored in *lval", otherwise *sval / *slen describe a string. */
unsigned int ziplistGet(unsigned char *p, unsigned char **sval, unsigned int *slen, long long *lval);
unsigned char *ziplistInsert(unsigned char *zl, unsigned char *p, unsigned char *s, unsigned int slen);
unsigned char *ziplistDelete(unsigned char *zl, unsigned char **p);
unsigned char *ziplistDeleteRange(unsigned char *zl, int index, unsigned int num);
unsigned int ziplistCompare(unsigned char *p, unsigned char *s, unsigned int slen);
unsigned char *ziplistFind(unsigned char *p, unsigned char *vstr, unsigned int vlen, unsigned int skip);
unsigned int ziplistLen(unsigned char *zl);
size_t ziplistBlobLen(unsigned char *zl);

#ifdef REDIS_TEST
int ziplistTest(int argc, char *argv[]);
#endif

#endif /* _ZIPLIST_H */


================================================
FILE: src/vr_zipmap.c
================================================
/* String -> String Map data structure optimized for size.
 * This file implements a data structure mapping strings to other strings
 * implementing an O(n) lookup data structure designed to be very memory
 * efficient.
 *
 * The Redis Hash type uses this data structure for hashes composed of a small
 * number of elements, to switch to a hash table once a given number of
 * elements is reached.
 *
 * Given that many times Redis Hashes are used to represent objects composed
 * of few fields, this is a very big win in terms of used memory.
 *
 * --------------------------------------------------------------------------
 *
 * Copyright (c) 2009-2010, Salvatore Sanfilippo <antirez at gmail dot com>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *   * Redistributions of source code must retain the above copyright notice,
 *     this list of conditions and the following disclaimer.
 *   * Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *   * Neither the name of Redis nor the names of its contributors may be used
 *     to endorse or promote products derived from this software without
 *     specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

/* Memory layout of a zipmap, for the map "foo" => "bar", "hello" => "world":
 *
 * <zmlen><len>"foo"<len><free>"bar"<len>"hello"<len><free>"world"
 *
 * <zmlen> is 1 byte length that holds the current size of the zipmap.
 * When the zipmap length is greater than or equal to 254, this value
 * is not used and the zipmap needs to be traversed to find out the length.
 *
 * <len> is the length of the following string (key or value).
 * <len> lengths are encoded in a single value or in a 5 bytes value.
 * If the first byte value (as an unsigned 8 bit value) is between 0 and
 * 253, it's a single-byte length. If it is 254 then a four bytes unsigned
 * integer follows (in the host byte ordering). A value of 255 is used to
 * signal the end of the hash.
 *
 * <free> is the number of free unused bytes after the string, resulting
 * from modification of values associated to a key. For instance if "foo"
 * is set to "bar", and later "foo" will be set to "hi", it will have a
 * free byte to use if the value will enlarge again later, or even in
 * order to add a key/value pair if it fits.
 *
 * <free> is always an unsigned 8 bit number, because if after an
 * update operation there are more than a few free bytes, the zipmap will be
 * reallocated to make sure it is as small as possible.
 *
 * The most compact representation of the above two elements hash is actually:
 *
 * "\x02\x03foo\x03\x00bar\x05hello\x05\x00world\xff"
 *
 * Note that because keys and values are prefixed length "objects",
 * the lookup will take O(N) where N is the number of elements
 * in the zipmap and *not* the number of bytes needed to represent the zipmap.
 * This lowers the constant times considerably.
 */

#include <stdio.h>
#include <string.h>

#include <vr_core.h>

#define ZIPMAP_BIGLEN 254
#define ZIPMAP_END 255

/* The following defines the max value for the <free> field described in the
 * comments above, that is, the max number of trailing bytes in a value. */
#define ZIPMAP_VALUE_MAX_FREE 4

/* The following macro returns the number of bytes needed to encode the length
 * for the integer value _l, that is, 1 byte for lengths < ZIPMAP_BIGLEN and
 * 5 bytes for all the other lengths. */
#define ZIPMAP_LEN_BYTES(_l) (((_l) < ZIPMAP_BIGLEN) ? 1 : sizeof(unsigned int)+1)

/* Allocate and return an empty zipmap: a zero <zmlen> byte immediately
 * followed by the end-of-map marker. */
unsigned char *zipmapNew(void) {
    unsigned char *map = dalloc(2);

    map[0] = 0;          /* <zmlen>: no entries yet */
    map[1] = ZIPMAP_END; /* terminator */
    return map;
}

/* Read the <len> field starting at 'p' and return the length it encodes.
 * A first byte below ZIPMAP_BIGLEN is the length itself; otherwise the
 * length is the 32 bit integer stored in the four bytes that follow. */
static unsigned int zipmapDecodeLength(unsigned char *p) {
    unsigned int decoded;

    if (p[0] < ZIPMAP_BIGLEN) {
        return p[0];
    }

    memcpy(&decoded, p + 1, sizeof(decoded));
    memrev32ifbe(&decoded);
    return decoded;
}

/* Write the <len> field for 'len' at 'p' and return how many bytes the
 * field occupies. When 'p' is NULL nothing is written and only the size
 * the field would take is returned. */
static unsigned int zipmapEncodeLength(unsigned char *p, unsigned int len) {
    /* Size-query mode. */
    if (p == NULL) return ZIPMAP_LEN_BYTES(len);

    if (len >= ZIPMAP_BIGLEN) {
        /* Marker byte followed by the 32 bit length. */
        p[0] = ZIPMAP_BIGLEN;
        memcpy(p+1,&len,sizeof(len));
        memrev32ifbe(p+1);
        return 1+sizeof(len);
    }

    /* Short form: the length fits in the single byte. */
    p[0] = len;
    return 1;
}

/* Walk the zipmap looking for 'key' (of 'klen' bytes) and return a pointer
 * to the start of the matching entry, or NULL when there is no match (or
 * when 'key' is NULL).
 *
 * When 'totlen' is not NULL the whole zipmap is always traversed and
 * *totlen is set to its total size in bytes, end marker included, so the
 * caller can reallocate the zipmap. When 'totlen' is NULL the function
 * returns as soon as the key is found. */
static unsigned char *zipmapLookupRaw(unsigned char *zm, unsigned char *key, unsigned int klen, unsigned int *totlen) {
    unsigned char *cursor = zm+1;
    unsigned char *match = NULL;

    while (cursor[0] != ZIPMAP_END) {
        unsigned int keylen = zipmapDecodeLength(cursor);
        unsigned int keyhdr = zipmapEncodeLength(NULL,keylen);
        unsigned int vallen;
        unsigned char slack;

        /* Compare against this entry's key; only the first match counts. */
        if (key != NULL && match == NULL && keylen == klen &&
            memcmp(cursor+keyhdr,key,keylen) == 0)
        {
            /* Nobody asked for the total length: stop right here. */
            if (totlen == NULL) return cursor;
            match = cursor;
        }
        cursor += keyhdr+keylen;

        /* Step over the value: <len>, the <free> byte, the payload and
         * the unused trailing bytes counted by <free>. */
        vallen = zipmapDecodeLength(cursor);
        cursor += zipmapEncodeLength(NULL,vallen);
        slack = cursor[0];
        cursor += vallen+1+slack;
    }

    if (totlen != NULL) *totlen = (unsigned int)(cursor-zm)+1;
    return match;
}

/* Return the number of bytes needed to store an entry whose key is 'klen'
 * bytes and whose value is 'vlen' bytes, with no trailing free space. */
static unsigned long zipmapRequiredLength(unsigned int klen, unsigned int vlen) {
    /* 3 = one-byte key <len> + one-byte value <len> + the <free> byte. */
    unsigned int total = klen+vlen+3;

    /* A length >= ZIPMAP_BIGLEN is encoded in 5 bytes instead of 1. */
    total += (klen >= ZIPMAP_BIGLEN) ? 4 : 0;
    total += (vlen >= ZIPMAP_BIGLEN) ? 4 : 0;
    return total;
}

/* Return the number of bytes occupied by the key starting at 'p':
 * its encoded <len> field plus the key payload. */
static unsigned int zipmapRawKeyLength(unsigned char *p) {
    unsigned int payload = zipmapDecodeLength(p);
    unsigned int header = zipmapEncodeLength(NULL,payload);

    return header + payload;
}

/* Return the number of bytes occupied by the value starting at 'p':
 * encoded <len> field + the <free> byte + payload + the unused trailing
 * bytes counted by <free>. */
static unsigned int zipmapRawValueLength(unsigned char *p) {
    unsigned int payload = zipmapDecodeLength(p);
    unsigned int header = zipmapEncodeLength(NULL,payload);
    unsigned int slack = p[header]; /* <free> sits right after <len> */

    return header + 1 + slack + payload;
}

/* Given 'p' pointing at the key of an entry, return the total number of
 * bytes the entry takes: key, value and any trailing free space. */
static unsigned int zipmapRawEntryLength(unsigned char *p) {
    unsigned int keybytes = zipmapRawKeyLength(p);
    unsigned int valbytes = zipmapRawValueLength(p+keybytes);

    return keybytes + valbytes;
}

/* Reallocate the zipmap to 'len' bytes and write the end marker in the
 * new last byte. Returns the (possibly moved) zipmap. */
static inline unsigned char *zipmapResize(unsigned char *zm, unsigned int len) {
    unsigned char *resized = drealloc(zm, len);

    resized[len-1] = ZIPMAP_END;
    return resized;
}

/* Set key to value, creating the key if it does not already exist.
 * If 'update' is not NULL, *update is set to 1 if the key was
 * already present, otherwise to 0.
 *
 * The zipmap may be reallocated (see zipmapResize), so the caller must
 * use the returned pointer instead of 'zm' afterwards. */
unsigned char *zipmapSet(unsigned char *zm, unsigned char *key, unsigned int klen, unsigned char *val, unsigned int vlen, int *update) {
    unsigned int zmlen, offset;
    /* reqlen: bytes the new key/value pair needs.
     * freelen: bytes available at the position where it will be written. */
    unsigned int freelen, reqlen = zipmapRequiredLength(klen,vlen);
    unsigned int empty, vempty;
    unsigned char *p;

    freelen = reqlen;
    if (update) *update = 0;
    /* Passing &zmlen forces a full traversal, so zmlen is the total size
     * of the zipmap whether or not the key is found. */
    p = zipmapLookupRaw(zm,key,klen,&zmlen);
    if (p == NULL) {
        /* Key not found: enlarge */
        zm = zipmapResize(zm, zmlen+reqlen);
        /* The new entry starts where the old end marker was. */
        p = zm+zmlen-1;
        zmlen = zmlen+reqlen;

        /* Increase zipmap length (this is an insert) */
        if (zm[0] < ZIPMAP_BIGLEN) zm[0]++;
    } else {
        /* Key found. Is there enough space for the new value? */
        /* Compute the total length: */
        if (update) *update = 1;
        freelen = zipmapRawEntryLength(p);
        if (freelen < reqlen) {
            /* Store the offset of this key within the current zipmap, so
             * it can be resized. Then, move the tail backwards so this
             * pair fits at the current position. */
            offset = p-zm;
            zm = zipmapResize(zm, zmlen-freelen+reqlen);
            p = zm+offset;

            /* The +1 in the number of bytes to be moved is caused by the
             * end-of-zipmap byte. Note: the *original* zmlen is used. */
            memmove(p+reqlen, p+freelen, zmlen-(offset+freelen+1));
            zmlen = zmlen-freelen+reqlen;
            freelen = reqlen;
        }
    }

    /* We now have a suitable block where the key/value entry can
     * be written. If there is too much free space, move the tail
     * of the zipmap a few bytes to the front and shrink the zipmap,
     * as we want zipmaps to be very space efficient. */
    empty = freelen-reqlen;
    if (empty >= ZIPMAP_VALUE_MAX_FREE) {
        /* First, move the tail <empty> bytes to the front, then resize
         * the zipmap to be <empty> bytes smaller. */
        offset = p-zm;
        memmove(p+reqlen, p+freelen, zmlen-(offset+freelen+1));
        zmlen -= empty;
        zm = zipmapResize(zm, zmlen);
        p = zm+offset;
        vempty = 0;
    } else {
        /* Few enough spare bytes: keep them and record the count in the
         * entry's <free> byte. */
        vempty = empty;
    }

    /* Just write the key + value and we are done. */
    /* Key: */
    p += zipmapEncodeLength(p,klen);
    memcpy(p,key,klen);
    p += klen;
    /* Value: <len>, then the <free> byte, then the payload. */
    p += zipmapEncodeLength(p,vlen);
    *p++ = vempty;
    memcpy(p,val,vlen);
    return zm;
}

/* Delete 'key' from the zipmap and return the zipmap to use afterwards
 * (it is reallocated when an entry is removed). If 'deleted' is not NULL,
 * *deleted is set to 1 when the key was found and removed, to 0 when it
 * was not found. */
unsigned char *zipmapDel(unsigned char *zm, unsigned char *key, unsigned int klen, int *deleted) {
    unsigned int total, entrylen;
    unsigned char *entry = zipmapLookupRaw(zm,key,klen,&total);

    if (entry == NULL) {
        if (deleted) *deleted = 0;
        return zm;
    }

    /* Slide everything after the entry (end marker excluded) over it,
     * then shrink; zipmapResize() writes the new end marker. */
    entrylen = zipmapRawEntryLength(entry);
    memmove(entry, entry+entrylen, total-((entry-zm)+entrylen+1));
    zm = zipmapResize(zm, total-entrylen);

    /* Keep the cached entry count in sync while it is still in use. */
    if (zm[0] < ZIPMAP_BIGLEN) zm[0]--;

    if (deleted) *deleted = 1;
    return zm;
}

/* Return the iterator start position for zipmapNext(): the byte right
 * after the leading <zmlen> byte. */
unsigned char *zipmapRewind(unsigned char *zm) {
    return &zm[1];
}

/* Iterate over the entries of a zipmap.
 *
 * 'zm' is the current iterator position: the value returned by
 * zipmapRewind() on the first call, and the value returned by the previous
 * zipmapNext() call afterwards. The function returns the position of the
 * following entry, or NULL when the end marker has been reached.
 *
 * When 'key' is not NULL, *key and *klen receive the key payload pointer
 * and length ('klen' must then be valid too); likewise for 'value' and
 * 'vlen'. The returned pointers reference the zipmap itself.
 *
 * Example:
 *
 * unsigned char *i = zipmapRewind(my_zipmap);
 * while((i = zipmapNext(i,&key,&klen,&value,&vlen)) != NULL) {
 *     printf("%u bytes key at %p\n", klen, key);
 *     printf("%u bytes value at %p\n", vlen, value);
 * }
 */
unsigned char *zipmapNext(unsigned char *zm, unsigned char **key, unsigned int *klen, unsigned char **value, unsigned int *vlen) {
    unsigned char *keypos = zm;
    unsigned char *valpos;

    if (*keypos == ZIPMAP_END) return NULL;

    if (key != NULL) {
        *klen = zipmapDecodeLength(keypos);
        /* The payload follows the encoded <len> field. */
        *key = keypos + ZIPMAP_LEN_BYTES(*klen);
    }

    valpos = keypos + zipmapRawKeyLength(keypos);
    if (value != NULL) {
        *vlen = zipmapDecodeLength(valpos);
        /* +1 skips the <free> byte stored between <len> and the payload. */
        *value = valpos + 1 + ZIPMAP_LEN_BYTES(*vlen);
    }

    return valpos + zipmapRawValueLength(valpos);
}

/* Look up 'key' and, when it exists, store a pointer to its value in
 * *value and the value length in *vlen. The pointer references the zipmap
 * itself. Returns 1 when the key is found, 0 otherwise (in which case
 * *value and *vlen are left untouched). */
int zipmapGet(unsigned char *zm, unsigned char *key, unsigned int klen, unsigned char **value, unsigned int *vlen) {
    unsigned char *entry = zipmapLookupRaw(zm,key,klen,NULL);

    if (entry == NULL) return 0;

    /* Move from the key to the value part of the entry. */
    entry += zipmapRawKeyLength(entry);
    *vlen = zipmapDecodeLength(entry);
    /* Payload = after the encoded <len> and the one-byte <free>. */
    *value = entry + ZIPMAP_LEN_BYTES(*vlen) + 1;
    return 1;
}

/* Tell whether 'key' is present in the zipmap: 1 if it is, 0 if not. */
int zipmapExists(unsigned char *zm, unsigned char *key, unsigned int klen) {
    unsigned char *entry = zipmapLookupRaw(zm,key,klen,NULL);

    return entry != NULL;
}

/* Return how many entries the zipmap holds.
 *
 * The leading <zmlen> byte is trusted while it is below ZIPMAP_BIGLEN.
 * Otherwise the entries are counted by iterating, and the count is
 * written back into <zmlen> if it turns out to be small enough. */
unsigned int zipmapLen(unsigned char *zm) {
    unsigned int count;
    unsigned char *it;

    if (zm[0] < ZIPMAP_BIGLEN) return zm[0];

    count = 0;
    for (it = zipmapRewind(zm);
         (it = zipmapNext(it,NULL,NULL,NULL,NULL)) != NULL; )
    {
        count++;
    }

    /* Re-store length if small enough */
    if (count < ZIPMAP_BIGLEN) zm[0] = count;
    return count;
}

/* Return the size in bytes of the whole zipmap (end marker included), i.e.
 * the number of bytes to write, starting at 'zm', in order to serialize
 * it. Computed by a full traversal of the zipmap. */
size_t zipmapBlobLen(unsigned char *zm) {
    unsigned int bytes;

    /* A NULL key never matches: the call is made only for its total
     * length output. */
    (void)zipmapLookupRaw(zm,NULL,0,&bytes);
    return bytes;
}


================================================
FILE: src/vr_zipmap.h
================================================
#ifndef _ZIPMAP_H
#define _ZIPMAP_H

/* size_t is used by zipmapBlobLen(); include it here so this header can be
 * included on its own, regardless of include order. */
#include <stddef.h>

/* Functions returning 'unsigned char *' for a zipmap 'zm' that they modify
 * (zipmapSet, zipmapDel) may reallocate it: always use the returned pointer
 * afterwards. */
unsigned char *zipmapNew(void);
unsigned char *zipmapSet(unsigned char *zm, unsigned char *key, unsigned int klen, unsigned char *val, unsigned int vlen, int *update);
unsigned char *zipmapDel(unsigned char *zm, unsigned char *key, unsigned int klen, int *deleted);
/* Iteration: start from zipmapRewind(zm) and feed each zipmapNext() result
 * back into zipmapNext() until it returns NULL. */
unsigned char *zipmapRewind(unsigned char *zm);
unsigned char *zipmapNext(unsigned char *zm, unsigned char **key, unsigned int *klen, unsigned char **value, unsigned int *vlen);
int zipmapGet(unsigned char *zm, unsigned char *key, unsigned int klen, unsigned char **value, unsigned int *vlen);
int zipmapExists(unsigned char *zm, unsigned char *key, unsigned int klen);
unsigned int zipmapLen(unsigned char *zm);
size_t zipmapBlobLen(unsigned char *zm);
/* NOTE(review): vr_zipmap.c does not appear to define zipmapRepr() --
 * confirm whether this declaration is still needed. */
void zipmapRepr(unsigned char *p);

#endif


================================================
FILE: tests/.gitignore
================================================
*.pyc
*.out
*.log

================================================
FILE: tests/Makefile.am
================================================
MAINTAINERCLEANFILES = Makefile.in

AM_CPPFLAGS =
if !OS_SOLARIS
AM_CPPFLAGS += -D_GNU_SOURCE
endif
AM_CPPFLAGS += -I $(top_srcdir)/dep/ae
AM_CPPFLAGS += -I $(top_srcdir)/dep/jemalloc-4.2.0/include
AM_CPPFLAGS += -I $(top_srcdir)/dep/hiredis-0.13.3
AM_CPPFLAGS += -I $(top_srcdir)/dep/dhashkit
AM_CPPFLAGS += -I $(top_srcdir)/dep/dlist
AM_CPPFLAGS += -I $(top_srcdir)/dep/darray
AM_CPPFLAGS += -I $(top_srcdir)/dep/util
AM_CPPFLAGS += -I $(top_srcdir)/dep/himemcached-0.1.0

AM_CFLAGS = 
AM_CFLAGS += -fno-strict-aliasing
AM_CFLAGS += -Wall -Wshadow
AM_CFLAGS += -Wpointer-arith
AM_CFLAGS += -Winline
AM_CFLAGS += -Wunused-function -Wunused-variable -Wunused-value
AM_CFLAGS += -Wno-unused-parameter -Wno-unused-value
AM_CFLAGS += -Wconversion -Wsign-compare
AM_CFLAGS += -Wstrict-prototypes -Wmissing-prototypes -Wredundant-decls -Wmissing-declarations

AM_LDFLAGS =
AM_LDFLAGS += -lm -lpthread -rdynamic
if !OS_DARWIN
AM_LDFLAGS += -lrt
endif
if OS_SOLARIS
AM_LDFLAGS += -lnsl -lsocket
endif
if OS_FREEBSD
AM_LDFLAGS += -lexecinfo
endif

noinst_PROGRAMS = viretest

viretest_SOURCES =                      \
    vrt_util.c vrt_util.h               \
    vrt_public.c vrt_public.h           \
    vrt_simple.c vrt_simple.h           \
    vrtest.c
    
viretest_LDADD = $(top_builddir)/dep/ae/libae.a
viretest_LDADD += $(top_builddir)/dep/hiredis-0.13.3/libhiredis.a
viretest_LDADD += $(top_builddir)/dep/darray/libdarray.a
viretest_LDADD += $(top_builddir)/dep/dmalloc/libdmalloc.a
viretest_LDADD += $(top_builddir)/dep/util/libdutil.a
viretest_LDADD += $(top_builddir)/dep/jemalloc-4.2.0/lib/libjemalloc.a

noinst_PROGRAMS += vireabtest

vireabtest_SOURCES =                        \
    vrt_util.c vrt_util.h                   \
    vrt_public.c vrt_public.h               \
    vrt_produce_data.c vrt_produce_data.h   \
    vrt_dispatch_data.c vrt_dispatch_data.h \
    vrt_check_data.c vrt_check_data.h       \
    vrt_backend.c vrt_backend.h             \
    vrabtest.c vrabtest.h
    
vireabtest_LDADD = $(top_builddir)/dep/ae/libae.a
vireabtest_LDADD += $(top_builddir)/dep/hiredis-0.13.3/libhiredis.a
vireabtest_LDADD += $(top_builddir)/dep/dhashkit/libdhashkit.a
vireabtest_LDADD += $(top_builddir)/dep/dlist/libdlist.a
vireabtest_LDADD += $(top_builddir)/dep/darray/libdarray.a
vireabtest_LDADD += $(top_builddir)/dep/dmalloc/libdmalloc.a
vireabtest_LDADD += $(top_builddir)/dep/util/libdutil.a
vireabtest_LDADD += $(top_builddir)/dep/jemalloc-4.2.0/lib/libjemalloc.a

noinst_PROGRAMS += vire-benchmark

vire_benchmark_SOURCES =                    \
    vrt_util.c vrt_util.h                   \
    vrt_public.c vrt_public.h               \
    vrt_benchmark.c
    
vire_benchmark_LDADD = $(top_builddir)/dep/ae/libae.a
vire_benchmark_LDADD += $(top_builddir)/dep/hiredis-0.13.3/libhiredis.a
vire_benchmark_LDADD += $(top_builddir)/dep/himemcached-0.1.0/libhimemcached.a
vire_benchmark_LDADD += $(top_builddir)/dep/dlist/libdlist.a
vire_benchmark_LDADD += $(top_builddir)/dep/darray/libdarray.a
vire_benchmark_LDADD += $(top_builddir)/dep/dmalloc/libdmalloc.a
vire_benchmark_LDADD += $(top_builddir)/dep/util/libdutil.a
vire_benchmark_LDADD += $(top_builddir)/dep/jemalloc-4.2.0/lib/libjemalloc.a

================================================
FILE: tests/vrabtest.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <getopt.h>
#include <fcntl.h>
#include <errno.h>
#include <signal.h>
#include <assert.h>
#include <sys/stat.h>
#include <sys/utsname.h>

#include <hiredis.h>
#include <darray.h>
#include <dlog.h>

#include <vrt_util.h>
#include <vrt_public.h>
#include <vrt_produce_data.h>
#include <vrt_dispatch_data.h>
#include <vrt_check_data.h>
#include <vrt_backend.h>
#include <vrabtest.h>

/* Default values for the command line options; they are installed by
 * vrt_set_default_options() before the arguments are parsed. A NULL
 * log file default is shown as "stderr" in the usage text. */
#define CONFIG_DEFAULT_PIDFILE                      NULL
#define CONFIG_DEFAULT_CHECKER                      "myself"
#define CONFIG_DEFAULT_TEST_INTERVAL                3600
#define CONFIG_DEFAULT_KEY_LENGTH_RANGE_BEGIN       0
#define CONFIG_DEFAULT_KEY_LENGTH_RANGE_END         100
#define CONFIG_DEFAULT_STRING_MAX_LENGTH            512
#define CONFIG_DEFAULT_FIELDS_MAX_COUNT             16
#define CONFIG_DEFAULT_TEST_TARGET                  ""
#define CONFIG_DEFAULT_PRODUCE_THREADS_COUNT        1
#define CONFIG_DEFAULT_CACHED_KEYS_COUNT            10000
#define CONFIG_DEFAULT_HIT_RATIO                    75
#define CONFIG_DEFAULT_DISPATCH_THREADS_COUNT       1
#define CONFIG_DEFAULT_CLIENTS_PER_DISPATCH_THREAD  10
#define CONFIG_DEFAULT_LOGFILE                      NULL

/* Kinds of server a test target group can refer to. */
#define VRABTEST_GROUP_TYPE_REDIS   0
#define VRABTEST_GROUP_TYPE_VIRE    1

/* Settings collected from the command line. Each field is first given its
 * default by vrt_set_default_options() and may then be overridden by the
 * option named next to it (see vrt_get_options()). */
struct config {
    char *checker;                  /* -C: checker used to check data consistency */
    long long test_interval;        /* -i: interval between consistency checks, in seconds */
    int key_length_range_begin;     /* -k: lower bound of generated key lengths */
    int key_length_range_end;       /* -k: upper bound of generated key lengths */
    int string_max_length;          /* -s: max length of generated strings */
    int fields_max_count;           /* -f: max number of generated fields */
    int cmd_type;                   /* -T: bitwise OR of TEST_CMD_TYPE_* flags */
    darray *cmd_blacklist;          /* -B: commands not to test, NULL if unset */
    darray *cmd_whitelist;          /* -W: only commands to test, NULL if unset */
    char *test_targets;             /* -t: test targets description string */
    int produce_data_threads;       /* -p: number of threads producing test data */
    long long cached_keys_per_produce_thread; /* -K: cached keys per produce thread */
    int hit_ratio;                  /* -H: hit ratio for readonly commands, 0..100 */
    int dispatch_data_threads;      /* -d: number of threads dispatching test data */
    int clients_per_dispatch_thread; /* -c: clients per dispatch thread */
    char *pid_filename;             /* -P: pid file, NULL if unset */
    char *log_filename;             /* -o: log file, NULL if unset */
};

/* Parsed command line settings for this process. */
static struct config config;

/* Flags raised by the -h, -V and -D options in vrt_get_options(). */
static int show_help;
static int show_version;
static int daemonize;

/* 0 or 1.
 * 1: the expire, expireat, pexpire and pexpireat commands are used
 *    (set by the -E option).
 * 0: those commands are not used. */
int expire_enabled;

/* Interval time for test data dispatched to test targets.
 * Unit is second. */
long long test_interval;

/* Last begin time to test the data.
 * Unit is second. */
long long last_test_begin_time;

/* Long option table for getopt_long(). Every long option maps to the short
 * option character in the last column, which vrt_get_options() switches
 * on. Keep this table in sync with short_options below. */
static struct option long_options[] = {
    { "help",                   no_argument,        NULL,   'h' },
    { "version",                no_argument,        NULL,   'V' },
    { "daemonize",              no_argument,        NULL,   'D' },
    { "enable-expire",          no_argument,        NULL,   'E' },
    { "pid-file",               required_argument,  NULL,   'P' },
    { "checker",                required_argument,  NULL,   'C' },
    { "test-interval",          required_argument,  NULL,   'i' },
    { "key-length-range",       required_argument,  NULL,   'k' },
    { "string-max-length",      required_argument,  NULL,   's' },
    { "fields-max-count",       required_argument,  NULL,   'f' },
    { "command-types",          required_argument,  NULL,   'T' },
    { "command-black-list",     required_argument,  NULL,   'B' },
    { "command-white-list",     required_argument,  NULL,   'W' },
    { "test-targets",           required_argument,  NULL,   't' },
    { "produce-data-threads",   required_argument,  NULL,   'p' },
    { "cached-keys",            required_argument,  NULL,   'K' },
    { "hit-ratio",              required_argument,  NULL,   'H' },
    { "dispatch-data-threads",  required_argument,  NULL,   'd' },
    { "clients",                required_argument,  NULL,   'c' },
    { "log-file",               required_argument,  NULL,   'o' },
    { NULL,                     0,                  NULL,    0  }
};

/* Short option string: a character followed by ':' takes an argument. */
static char short_options[] = "hVDEP:C:i:k:s:f:T:B:W:t:p:K:H:d:c:o:";

/* Print the vireabtest usage text (synopsis plus one line per option) to
 * standard output. The default log file is shown as "stderr" when
 * CONFIG_DEFAULT_LOGFILE is NULL. */
static void
vrt_show_usage(void)
{
    printf(
        "Usage: vireabtest [-?hVDE]" CRLF
        "" CRLF);
    /* Options that take no argument. */
    printf(
        "Options:" CRLF
        "  -h, --help                   : this help" CRLF
        "  -V, --version                : show version and exit" CRLF
        "  -D, --daemonize              : run as a daemon" CRLF
        "  -E, --enable-expire          : enable the expire" CRLF);
    /* Options that take an argument; the only format argument is the
     * default log file name. */
    printf(
        "  -P, --pid-file               : pid file" CRLF
        "  -C, --checker                : the checker to check data consistency" CRLF
        "  -i, --test-interval          : the interval for checking data consistency, unit is second" CRLF
        "  -k, --key-length-range       : the key length range to generate for test, like 0-100" CRLF
        "  -s, --string-max-length      : the max string length to generate for test, string is for STRING/LIST... value element" CRLF
        "  -f, --fields-max-count       : the max fields count to generate for test, field is the LIST/HASH...'s element" CRLF
        "  -T, --command-types          : the command types to generate for test, like string,hash,key" CRLF
        "  -B, --command-black-list     : the commands not want to test, like del,lrange,mget" CRLF
        "  -W, --command-white-list     : the commands only allows to test, like del,lrange,mget" CRLF
        "  -t, --test-targets           : the test targets for test, like vire[127.0.0.1:12301]-redis[127.0.0.1:12311]" CRLF
        "  -p, --produce-data-threads   : the threads count to produce test data" CRLF
        "  -K, --cached-keys            : the cached keys count for every produce data thread" CRLF
        "  -H, --hit-ratio              : the hit ratio for readonly commands, between 0 and 100" CRLF
        "  -d, --dispatch-data-threads  : the threads count to dispatch test data to target groups" CRLF
        "  -c, --clients                : the clients count for every dispatch data thread" CRLF
        "  -o, --log-file               : set logging file (default: %s)" CRLF
        "", 
        CONFIG_DEFAULT_LOGFILE != NULL ? CONFIG_DEFAULT_LOGFILE : "stderr");
}

/* Reset every command line setting to its built-in default. Meant to run
 * before vrt_get_options() so that only the options actually given on the
 * command line override these values. */
static void
vrt_set_default_options(void)
{
    /* Process-level settings. */
    expire_enabled = 0;
    config.pid_filename = CONFIG_DEFAULT_PIDFILE;
    config.log_filename = CONFIG_DEFAULT_LOGFILE;

    /* What to check, and how often. */
    config.checker = CONFIG_DEFAULT_CHECKER;
    config.test_interval = CONFIG_DEFAULT_TEST_INTERVAL;
    config.test_targets = CONFIG_DEFAULT_TEST_TARGET;

    /* Shape of the generated test data. */
    config.key_length_range_begin = CONFIG_DEFAULT_KEY_LENGTH_RANGE_BEGIN;
    config.key_length_range_end = CONFIG_DEFAULT_KEY_LENGTH_RANGE_END;
    config.string_max_length = CONFIG_DEFAULT_STRING_MAX_LENGTH;
    config.fields_max_count = CONFIG_DEFAULT_FIELDS_MAX_COUNT;

    /* Commands to exercise: every command type, no black/white list. */
    config.cmd_type = TEST_CMD_TYPE_STRING | TEST_CMD_TYPE_LIST |
                      TEST_CMD_TYPE_SET | TEST_CMD_TYPE_ZSET |
                      TEST_CMD_TYPE_HASH | TEST_CMD_TYPE_SERVER |
                      TEST_CMD_TYPE_KEY;
    config.cmd_blacklist = NULL;
    config.cmd_whitelist = NULL;

    /* Producer side. */
    config.produce_data_threads = CONFIG_DEFAULT_PRODUCE_THREADS_COUNT;
    config.cached_keys_per_produce_thread = CONFIG_DEFAULT_CACHED_KEYS_COUNT;
    config.hit_ratio = CONFIG_DEFAULT_HIT_RATIO;

    /* Dispatcher side. */
    config.dispatch_data_threads = CONFIG_DEFAULT_DISPATCH_THREADS_COUNT;
    config.clients_per_dispatch_thread = CONFIG_DEFAULT_CLIENTS_PER_DISPATCH_THREAD;
}

static void
vrt_clean_options(void)
{
    if (config.cmd_blacklist != NULL) {
        sds *command;
        while (darray_n(config.cmd_blacklist) > 0) {
            command = darray_pop(config.cmd_blacklist);
            sdsfree(command);
        }
        darray_destroy(config.cmd_blacklist);
        config.cmd_blacklist = NULL;
    }

    if (config.cmd_whitelist != NULL) {
        sds *command;
        while (darray_n(config.cmd_whitelist) > 0) {
            command = darray_pop(config.cmd_whitelist);
            sdsfree(command);
        }
        darray_destroy(config.cmd_whitelist);
        config.cmd_whitelist = NULL;
    }
}

/* Parse the command line into 'config' and the option flags
 * (show_help, show_version, daemonize, expire_enabled).
 *
 * argc/argv: the arguments as received by main().
 *
 * Returns VRT_OK when every option was parsed, VRT_ERROR (after printing
 * a diagnostic with log_stderr) on the first invalid option, missing
 * argument or malformed value. String-valued options keep pointing into
 * argv (optarg is stored, not copied). */
static int
vrt_get_options(int argc, char **argv)
{
    int c;
    long lvalue;
    long long llvalue;
    long long *range;
    int range_count;

    /* Errors are reported here, not by getopt itself. */
    opterr = 0;

    for (;;) {
        c = getopt_long(argc, argv, short_options, long_options, NULL);
        if (c == -1) {
            /* no more options */
            break;
        }

        switch (c) {
        case 'h':
            show_version = 1;
            show_help = 1;
            break;

        case 'V':
            show_version = 1;
            break;
            
        case 'D':
            daemonize = 1;
            break;

        case 'E':
            expire_enabled = 1;
            break;
            
        case 'C':
            config.checker = optarg;
            break;

        case 'i':
            if (string2ll(optarg,strlen(optarg),&llvalue) != 1) {
                log_stderr("vireabtest: option -i requires a number");
                return VRT_ERROR;
            }
            config.test_interval = llvalue;
            break;
            
        case 'k':
            range = get_range_from_string(optarg,strlen(optarg),&range_count);
            if (range == NULL) {
                log_stderr("vireabtest: option -k is invalid, you need input a range like 0-100");
                return VRT_ERROR;
            }
            /* A single number means begin == end. */
            config.key_length_range_begin = (int)range[0];
            if (range_count == 1) config.key_length_range_end = (int)range[0];
            else if (range_count == 2) config.key_length_range_end = (int)range[1];
            else assert(0);

            free(range);
            
            break;

        case 's':
            if (string2l(optarg,strlen(optarg),&lvalue) != 1) {
                log_stderr("vireabtest: option -s requires a number");
                return VRT_ERROR;
            }
            config.string_max_length = (int)lvalue;
            break;

        case 'f':
            if (string2l(optarg,strlen(optarg),&lvalue) != 1) {
                log_stderr("vireabtest: option -f requires a number");
                return VRT_ERROR;
            }
            config.fields_max_count = (int)lvalue;
            break;
            
        case 'T':
            config.cmd_type = parse_command_types(optarg);
            if (config.cmd_type <= 0) {
                log_stderr("vireabtest: option -T requires the correct command types");
                return VRT_ERROR;
            }
            break;

        case 'B':
            config.cmd_blacklist = parse_command_list(optarg);
            if (config.cmd_blacklist == NULL) {
                log_stderr("vireabtest: option -B requires the correct command list");
                return VRT_ERROR;
            }
            break;

        case 'W':
            config.cmd_whitelist = parse_command_list(optarg);
            if (config.cmd_whitelist == NULL) {
                log_stderr("vireabtest: option -W requires the correct command list");
                return VRT_ERROR;
            }
            break;
            
        case 't':
            config.test_targets = optarg;
            break;

        case 'p':
            if (string2l(optarg,strlen(optarg),&lvalue) != 1) {
                log_stderr("vireabtest: option -p requires a number");
                return VRT_ERROR;
            }
            config.produce_data_threads = (int)lvalue;
            break;

        case 'K':
            if (string2ll(optarg,strlen(optarg),&llvalue) != 1) {
                log_stderr("vireabtest: option -K requires a number");
                return VRT_ERROR;
            }
            /* 1000 itself is accepted. */
            if (llvalue < 1000) {
                log_stderr("vireabtest: option -K requires a number that must be at least 1000");
                return VRT_ERROR;
            }
            
            config.cached_keys_per_produce_thread = llvalue;
            break;

        case 'H':
            if (string2l(optarg,strlen(optarg),&lvalue) != 1) {
                log_stderr("vireabtest: option -H requires a number");
                return VRT_ERROR;
            }
            if (lvalue < 0 || lvalue > 100) {
                log_stderr("vireabtest: option hit-ratio need between 0 and 100");
                return VRT_ERROR;
            }
            config.hit_ratio = (int)lvalue;
            break;

        case 'd':
            if (string2l(optarg,strlen(optarg),&lvalue) != 1) {
                log_stderr("vireabtest: option -d requires a number");
                return VRT_ERROR;
            }
            config.dispatch_data_threads = (int)lvalue;
            break;

        case 'c':
            if (string2l(optarg,strlen(optarg),&lvalue) != 1) {
                log_stderr("vireabtest: option -c requires a number");
                return VRT_ERROR;
            }
            config.clients_per_dispatch_thread = (int)lvalue;
            break;
            
        case 'P':
            config.pid_filename = optarg;
            break;

        case 'o':
            config.log_filename = optarg;
            break;
            
        case '?':
            /* getopt returns '?' both for an unknown option and for a
             * known option whose argument is missing; optopt holds the
             * offending option character. Known options are reported as
             * missing their argument, anything else as invalid. */
            switch (optopt) {
            case 'C':
            case 'k':
            case 'T':
            case 'B':
            case 'W':
            case 't':
            case 'P':
            case 'o':
                log_stderr("vireabtest: option -%c requires string",
                           optopt);
                break;

            case 'i':
            case 's':
            case 'f':
            case 'p':
            case 'K':
            case 'H':
            case 'd':
            case 'c':
                log_stderr("vireabtest: option -%c requires number",
                           optopt);
                break;
                
            default:
                log_stderr("vireabtest: invalid option -- '%c'", optopt);
                break;
            }
            return VRT_ERROR;

        default:
            /* An option listed in short_options but not handled above;
             * optopt is only meaningful after a '?' return, so report
             * the character getopt actually returned. */
            log_stderr("vireabtest: invalid option -- '%c'", c);
            return VRT_ERROR;

        }
    }

    return VRT_OK;
}

/*
 * Turn the calling process into a background daemon.
 *
 * The sequence is: fork (parent exits), setsid(), ignore SIGHUP, fork again
 * (first child exits), optionally chdir("/"), clear the umask and point
 * stdin/stdout/stderr at /dev/null.
 *
 * dump_core: when 0 the working directory is changed to "/"; any other
 *            value leaves the working directory untouched.
 *
 * Returns VRT_OK in the surviving (second) child on success and VRT_ERROR
 * if any step fails. The intermediate processes leave through _exit(0) and
 * never return from this function.
 */
static int vrt_daemonize(int dump_core)
{
    int ret;
    pid_t pid, sid;
    int fd;

    pid = fork();
    switch (pid) {
    case -1:
        log_error("fork() failed: %s", strerror(errno));
        return VRT_ERROR;

    case 0:
        break;

    default:
        /* parent terminates */
        _exit(0);
    }

    /* 1st child continues and becomes the session leader */

    sid = setsid();
    if (sid < 0) {
        log_error("setsid() failed: %s", strerror(errno));
        return VRT_ERROR;
    }

    /* SIGHUP is ignored before the second fork below */
    if (signal(SIGHUP, SIG_IGN) == SIG_ERR) {
        log_error("signal(SIGHUP, SIG_IGN) failed: %s", strerror(errno));
        return VRT_ERROR;
    }

    pid = fork();
    switch (pid) {
    case -1:
        log_error("fork() failed: %s", strerror(errno));
        return VRT_ERROR;

    case 0:
        break;

    default:
        /* 1st child terminates */
        _exit(0);
    }

    /* 2nd child continues */

    /* change working directory */
    if (dump_core == 0) {
        ret = chdir("/");
        if (ret < 0) {
            log_error("chdir(\"/\") failed: %s", strerror(errno));
            return VRT_ERROR;
        }
    }

    /* clear file mode creation mask */
    umask(0);

    /* redirect stdin, stdout and stderr to "/dev/null" */

    fd = open("/dev/null", O_RDWR);
    if (fd < 0) {
        log_error("open(\"/dev/null\") failed: %s", strerror(errno));
        return VRT_ERROR;
    }

    ret = dup2(fd, STDIN_FILENO);
    if (ret < 0) {
        log_error("dup2(%d, STDIN) failed: %s", fd, strerror(errno));
        close(fd);
        return VRT_ERROR;
    }

    ret = dup2(fd, STDOUT_FILENO);
    if (ret < 0) {
        log_error("dup2(%d, STDOUT) failed: %s", fd, strerror(errno));
        close(fd);
        return VRT_ERROR;
    }

    ret = dup2(fd, STDERR_FILENO);
    if (ret < 0) {
        log_error("dup2(%d, STDERR) failed: %s", fd, strerror(errno));
        close(fd);
        return VRT_ERROR;
    }

    /* Only close fd when it is not itself one of the three standard
     * descriptors that were just redirected. */
    if (fd > STDERR_FILENO) {
        ret = close(fd);
        if (ret < 0) {
            log_error("close(%d) failed: %s", fd, strerror(errno));
            return VRT_ERROR;
        }
    }

    return VRT_OK;
}

/*
 * Initialize an abtest_server from an address of the form "host:port".
 *
 * abs:     server slot to fill; every field is reset first, so on failure
 *          the slot holds host == NULL, port == 0 and owns nothing.
 * address: NUL-terminated "host:port" string.
 *
 * Returns VRT_OK on success. Returns VRT_ERROR when address is NULL, does
 * not split into exactly two ':'-separated parts, or the port is not a
 * number in the range 1..65535.
 */
static int abtest_server_init(abtest_server *abs, char *address)
{
    sds *host_port;
    int count;
    long value;

    abs->host = NULL;
    abs->port = 0;
    abs->conn_contexts = NULL;
    abs->data = NULL;

    if (address == NULL) {
        return VRT_ERROR;
    }

    host_port = sdssplitlen(address,strlen(address),":",1,&count);
    if (host_port == NULL) {
        return VRT_ERROR;
    } else if (count != 2) {
        sdsfreesplitres(host_port,count);
        return VRT_ERROR;
    }

    /* Validate the port before taking ownership of the host string, and
     * reject values that would be silently truncated by the int cast. */
    if (string2l(host_port[1],sdslen(host_port[1]),&value) != 1 ||
        value < 1 || value > 65535) {
        sdsfreesplitres(host_port,count);
        return VRT_ERROR;
    }

    /* Steal the host token so sdsfreesplitres() does not free it. */
    abs->host = host_port[0];
    host_port[0] = NULL;
    abs->port = (int)value;

    sdsfreesplitres(host_port,count);

    return VRT_OK;
}

/*
 * Release what an abtest_server owns: the host string and the (already
 * emptied) connection-context array. The port is reset to 0.
 * The 'data' field is not touched here.
 */
static void abtest_server_deinit(abtest_server *abs)
{
    darray *contexts = abs->conn_contexts;

    if (abs->host != NULL) {
        sdsfree(abs->host);
        abs->host = NULL;
    }

    if (abs->port > 0) {
        abs->port = 0;
    }

    if (contexts == NULL) {
        return;
    }

    /* The owner must have popped every connection context beforehand. */
    ASSERT(darray_n(contexts) == 0);
    darray_destroy(contexts);
    abs->conn_contexts = NULL;
}

/*
 * Map a key to the index of the server inside 'abg' that should handle it.
 *
 * The index is the CRC32a hash of the key modulo the number of servers.
 * With zero or one server the function returns 0 without hashing; the
 * zero case is guarded so that the modulo below never divides by zero.
 */
unsigned int get_backend_server_idx(abtest_group *abg, char *key, size_t keylen)
{
    unsigned int hashvalue, servers_count;

    servers_count = darray_n(&abg->abtest_servers);
    if (servers_count <= 1) {
        return 0;
    }

    hashvalue = (unsigned int)hash_crc32a(key, keylen);

    return hashvalue%servers_count;
}

/*
 * Return the server of 'abg' selected for the given key. The index comes
 * from the group's own get_backend_server_idx callback.
 */
abtest_server *get_backend_server(abtest_group *abg, char *key, size_t keylen)
{
    unsigned int server_idx = abg->get_backend_server_idx(abg,key,keylen);

    return darray_get(&abg->abtest_servers, server_idx);
}

/*
 * Initialize an abtest_group from a string such as
 * "vire[127.0.0.1:12301,127.0.0.1:12302]".
 *
 * abg:          group slot to fill. Its server array is always initialized,
 *               even on failure, so the caller can run abtest_group_deinit()
 *               on it in either case.
 * group_string: must be an sds string (its length is read with sdslen()).
 *
 * The part before '[' selects the group type ("vire" or "redis", case
 * insensitive); the part between '[' and the trailing ']' is a comma
 * separated list of "host:port" addresses, one server per address.
 *
 * Returns VRT_OK on success, VRT_ERROR on any parse or allocation failure.
 */
static int abtest_group_init(abtest_group *abg, char *group_string)
{
    sds *type_addrs = NULL, *addrs = NULL;
    int type_addrs_count = 0, addrs_count = 0;
    int ret = VRT_ERROR;
    int j;

    abg->type = 0;
    darray_init(&abg->abtest_servers, 1, sizeof(abtest_server));

    /* Install the callbacks up front so they are never left uninitialized,
     * whatever path this function leaves through. */
    abg->get_backend_server_idx = get_backend_server_idx;
    abg->get_backend_server = get_backend_server;

    type_addrs = sdssplitlen(group_string,sdslen(group_string),"[",1,&type_addrs_count);
    if (type_addrs == NULL || type_addrs_count != 2) {
        goto done;
    }

    if (!strcasecmp(type_addrs[0],"vire")) {
        abg->type = VRABTEST_GROUP_TYPE_VIRE;
    } else if (!strcasecmp(type_addrs[0],"redis")) {
        abg->type = VRABTEST_GROUP_TYPE_REDIS;
    } else {
        goto done;
    }

    /* The address list must be non-empty and end with ']'. */
    if (sdslen(type_addrs[1]) <= 1 ||
        type_addrs[1][sdslen(type_addrs[1])-1] != ']') {
        goto done;
    }

    /* Drop the trailing ']'. */
    sdsrange(type_addrs[1],0,-2);

    addrs = sdssplitlen(type_addrs[1],sdslen(type_addrs[1]),",",1,&addrs_count);
    if (addrs == NULL || addrs_count < 1) {
        goto done;
    }

    for (j = 0; j < addrs_count; j ++) {
        abtest_server *abs = darray_push(&abg->abtest_servers);
        if (abs == NULL) {
            goto done;
        }
        if (abtest_server_init(abs,addrs[j]) != VRT_OK) {
            goto done;
        }
    }

    ret = VRT_OK;

done:
    if (addrs != NULL) {
        sdsfreesplitres(addrs,addrs_count);
    }
    if (type_addrs != NULL) {
        sdsfreesplitres(type_addrs,type_addrs_count);
    }

    return ret;
}

/*
 * Tear down a group: reset its type, deinit every server it holds (popping
 * them from the array one at a time) and release the server array storage.
 */
static void abtest_group_deinit(abtest_group *abg)
{
    darray *servers = &abg->abtest_servers;

    abg->type = 0;

    for (; darray_n(servers) > 0; ) {
        abtest_server *server = darray_pop(servers);
        abtest_server_deinit(server);
    }

    darray_deinit(servers);
}

/*
 * Build the array of abtest_group described by 'groups_string'.
 *
 * groups_string is like
 * "vire[127.0.0.1:12301,127.0.0.1:12302]-redis[127.0.0.1:12311,127.0.0.1:12312]":
 * groups are separated by '-', and each group is parsed by
 * abtest_group_init().
 *
 * Returns a newly created darray of abtest_group that the caller releases
 * with abtest_groups_destroy(), or NULL when the string is NULL, cannot be
 * split, or any group fails to parse.
 */
darray *abtest_groups_create(char *groups_string)
{
    darray *abgs;
    sds *group_strings;
    int group_count, j;

    if (groups_string == NULL) {
        return NULL;
    }

    group_strings = sdssplitlen(groups_string,strlen(groups_string),"-",1,&group_count);
    if (group_strings == NULL) {
        return NULL;
    } else if (group_count < 1) {
        sdsfreesplitres(group_strings,group_count);
        return NULL;
    }

    abgs = darray_create(2, sizeof(abtest_group));
    if (abgs == NULL) {
        sdsfreesplitres(group_strings,group_count);
        return NULL;
    }

    for (j = 0; j < group_count; j ++) {
        abtest_group *abg = darray_push(abgs);

        if (abg == NULL) {
            sdsfreesplitres(group_strings,group_count);
            abtest_groups_destroy(abgs);
            return NULL;
        }

        /* abtest_group_init() initializes the group's server array before
         * it can fail, so the destroy call below may safely deinit it. */
        if (abtest_group_init(abg,group_strings[j]) != VRT_OK) {
            sdsfreesplitres(group_strings,group_count);
            abtest_groups_destroy(abgs);
            return NULL;
        }
    }

    /* The split tokens are no longer needed once every group is parsed. */
    sdsfreesplitres(group_strings,group_count);

    return abgs;
}

/*
 * Destroy an array created by abtest_groups_create(): every group is popped
 * and deinitialized, then the array itself is released.
 */
void abtest_groups_destroy(darray *abgs)
{
    abtest_group *group;

    for (; darray_n(abgs) > 0; ) {
        group = darray_pop(abgs);
        abtest_group_deinit(group);
    }

    darray_destroy(abgs);
}

/*
 * Entry point of the vireabtest tool.
 *
 * Parses the command line, optionally prints version/help, sets up logging,
 * optionally daemonizes, then initializes, starts and waits for the four
 * stages (data producer, data dispatcher, backend, data checker) before
 * tearing them down in reverse order.
 *
 * Exits with status 1 on option or initialization errors, 0 after printing
 * the version, and returns VRT_OK after a complete run.
 */
int
main(int argc, char **argv)
{
    int ret;

    vrt_set_default_options();

    ret = vrt_get_options(argc, argv);
    if (ret != VRT_OK) {
        vrt_show_usage();
        exit(1);
    }

    /* Usage is only printed here when show_version is set as well. */
    if (show_version) {
        log_stdout("This is vireabtest-%s", VR_VERSION_STRING);
        if (show_help) {
            vrt_show_usage();
        }
        exit(0);
    }

    ret = log_init(LOG_INFO, config.log_filename);
    if (ret < 0) {
        exit(1);
    }

    if (daemonize) {
        /* dump_core == 1: vrt_daemonize() keeps the current working
         * directory instead of changing to "/". */
        ret = vrt_daemonize(1);
        if (ret != VRT_OK) {
            exit(1);
        }
    }

    test_interval = config.test_interval;
    
    ret = vrt_produce_data_init(config.key_length_range_begin,
        config.key_length_range_end,
        config.string_max_length,config.fields_max_count,
        config.cmd_type,config.cmd_blacklist,config.cmd_whitelist,
        config.produce_data_threads,
        config.cached_keys_per_produce_thread, 
        config.hit_ratio);
    if (ret != VRT_OK) {
        log_error("Init data producer failed");
        exit(1);
    }
    ret = vrt_dispatch_data_init(config.dispatch_data_threads, 
        config.test_targets, config.clients_per_dispatch_thread);
    if (ret != VRT_OK) {
        log_error("Init data dispatcher failed");
        exit(1);
    }
    /* One backend thread is created per dispatch thread. */
    ret = vrt_backend_init(config.dispatch_data_threads, 
        config.test_targets);
    if (ret != VRT_OK) {
        log_error("Init backend thread failed");
        exit(1);
    }
    ret = vrt_data_checker_init(config.checker, config.test_targets);
    if (ret != VRT_OK) {
        log_error("Init check data thread failed");
        exit(1);
    }

    log_debug(LOG_INFO,"State lock type: %s", TEST_STATE_LOCK_TYPE);

    /* Start every stage, then block until each one finishes. */
    vrt_start_produce_data();
    vrt_start_dispatch_data();
    vrt_start_backend();
    vrt_start_data_checker();

    vrt_wait_produce_data();
    vrt_wait_dispatch_data();
    vrt_wait_backend();
    vrt_wait_data_checker();

    /* Tear down in the reverse order of initialization. */
    vrt_data_checker_deinit();
    vrt_backend_deinit();
    vrt_dispatch_data_deinit();
    vrt_produce_data_deinit();

    log_deinit();
    vrt_clean_options();
    
    return VRT_OK;
}


================================================
FILE: tests/vrabtest.h
================================================
#ifndef _VRABTEST_H_
#define _VRABTEST_H_

#include <darray.h>

struct redisContext;
struct redisAsyncContext;
struct abtest_group;

/* One connection to a test target. The backend thread code creates 'actx'
 * with redisAsyncConnect() and leaves 'ctx' NULL; each non-NULL handle is
 * released with redisFree() / redisAsyncFree() respectively. */
typedef struct conn_context {
    struct redisContext *ctx;          /* hiredis context, released with redisFree() */
    struct redisAsyncContext *actx;    /* hiredis async context, released with redisAsyncFree() */
} conn_context;

/* A single server inside a test group, parsed from a "host:port" address. */
typedef struct abtest_server {
    sds host;   /* host part of the address; owned by this struct */
    int port;   /* port part of the address; 0 when unset */

    darray *conn_contexts;  /* connection context */

    void *data; /* opaque per-server slot for the owning module; the backend
                 * thread code stores its task_data here */
} abtest_server;

/* Callback: map a key (pointer, length) to a server index within a group. */
typedef unsigned int (*backend_server_idx_t)(struct abtest_group*, char *, size_t);
/* Callback: map a key (pointer, length) to the server that handles it. */
typedef abtest_server *(*backend_server_t)(struct abtest_group*, char *, size_t);

/* A group of servers of one type ("vire" or "redis" in the group string),
 * together with the key-to-server routing callbacks. */
typedef struct abtest_group {
    int type;   /* one of the VRABTEST_GROUP_TYPE_* values; 0 when unset */
    
    darray abtest_servers;    /* type: abtest_server */

    backend_server_idx_t    get_backend_server_idx;
    backend_server_t        get_backend_server;
} abtest_group;

extern int expire_enabled;
extern long long test_interval;
extern long long last_test_begin_time;

darray *abtest_groups_create(char *groups_string);
void abtest_groups_destroy(darray *abgs);

#endif


================================================
FILE: tests/vrt_backend.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <getopt.h>
#include <fcntl.h>
#include <errno.h>
#include <signal.h>
#include <sys/stat.h>
#include <sys/utsname.h>

#include <hiredis.h>
#include <async.h>
#include <adapters/ae.h>

#include <dhashkit.h>
#include <dlist.h>
#include <dmtqueue.h>

#include <vrt_util.h>
#include <vrt_public.h>
#include <vrabtest.h>
#include <vrt_produce_data.h>
#include <vrt_dispatch_data.h>
#include <vrt_backend.h>

typedef struct task_data {
    long long maxmemory;
    long long used_memory;
    long long total_system_memory;
    
    int deleting;   /* backend thread is deleting keys */
    long long cursor;   /* scan cursor */
} task_data;

/* Number of backend threads requested in vrt_backend_init(). */
int backend_threads_count;
/* Array of backend_thread, created in vrt_backend_init(). */
static darray *backend_threads = NULL;

/* NOTE(review): not referenced in this file's visible code; presumably
 * counts backend threads that have finished pausing - confirm at the
 * definition of one_backend_thread_paused(). */
int backend_threads_pause_finished_count;

/*
 * Allocate a task_data with every field set to zero.
 *
 * Returns the new object, or NULL if the allocation fails. The caller
 * releases it with task_data_destroy().
 *
 * The return type is a pointer: the previous 'int' return type truncated
 * the address on platforms where pointers are wider than int.
 */
static task_data *task_data_create(void)
{
    task_data *td;

    td = malloc(sizeof(*td));
    if (td == NULL) {
        return NULL;
    }

    td->maxmemory = 0;
    td->used_memory = 0;
    td->total_system_memory = 0;
    td->deleting = 0;
    td->cursor = 0;

    return td;
}

/* Release a task_data obtained from task_data_create(). NULL is accepted. */
static void task_data_destroy(task_data *td)
{
    if (td == NULL) {
        return;
    }

    free(td);
}

/*
 * Open an asynchronous hiredis connection to host:port and store it in
 * cc->actx; cc->ctx is left NULL.
 *
 * Returns VRT_OK on success. Returns VRT_ERROR, with cc->actx == NULL, when
 * the context cannot be allocated or hiredis reports an error on the
 * freshly created context (its 'err' field is non-zero).
 */
static int backend_conn_context_init(conn_context *cc, char *host, int port)
{
    cc->ctx = NULL;
    cc->actx = NULL;

    cc->actx = redisAsyncConnect(host, port);
    if (cc->actx == NULL) {
        return VRT_ERROR;
    }

    /* redisAsyncConnect() can hand back a context that already carries an
     * error; such a context must not be attached to the event loop. */
    if (cc->actx->err) {
        test_log_out("Error: %s\n", cc->actx->errstr);
        redisAsyncFree(cc->actx);
        cc->actx = NULL;
        return VRT_ERROR;
    }

    return VRT_OK;
}

/*
 * Release both hiredis handles of a connection context and reset the
 * pointers to NULL so the context can be deinitialized again safely.
 */
static void backend_conn_context_deinit(conn_context *cc)
{
    if (cc->ctx) {
        redisFree(cc->ctx);
        cc->ctx = NULL;     /* was '==', a comparison with no effect */
    }

    if (cc->actx) {
        redisAsyncFree(cc->actx);
        cc->actx = NULL;    /* was '==', a comparison with no effect */
    }
}

/* hiredis connect callback: logs the context's error string when the
 * connection attempt did not succeed; does nothing otherwise. */
static void connect_callback(const redisAsyncContext *c, int status) {
    if (status == REDIS_OK) {
        return;
    }

    test_log_out("Error: %s\n", c->errstr);
}

/* hiredis disconnect callback: logs the context's error string when the
 * disconnect was caused by an error; does nothing otherwise. */
static void disconnect_callback(const redisAsyncContext *c, int status) {
    if (status == REDIS_OK) {
        return;
    }

    test_log_out("Error: %s\n", c->errstr);
}

/*
 * Reply handler for the "scan <cursor> count 1000" command issued while a
 * server is in deleting mode.
 *
 * privdata is the abtest_server the scan was sent to. A well-formed reply
 * is a two element array: the next cursor (string) and an array of keys.
 * The cursor is stored in the server's task_data, one delete command is
 * dispatched per returned key, and the next scan is issued on the server's
 * first connection. Any malformed reply, or a server that is no longer in
 * deleting mode, ends the chain without issuing another scan.
 */
static void scan_for_delete_callback(redisAsyncContext *c, void *r, void *privdata) {
    abtest_server *server = privdata;
    task_data *td = server->data;
    redisReply *reply = r;
    redisReply *cursor_reply, *keys_reply;
    conn_context *cc;
    long long next_cursor;
    size_t idx;

    if (reply == NULL || !td->deleting) {
        return;
    }

    if (reply->type != REDIS_REPLY_ARRAY || reply->elements != 2) {
        return;
    }

    /* Element 0: the cursor to continue from. */
    cursor_reply = reply->element[0];
    if (cursor_reply->type != REDIS_REPLY_STRING) {
        return;
    }
    if (string2ll(cursor_reply->str,cursor_reply->len,&next_cursor) != 1) {
        return;
    }
    td->cursor = next_cursor;

    /* Element 1: the batch of keys found by this scan step. */
    keys_reply = reply->element[1];
    if (keys_reply->type != REDIS_REPLY_ARRAY) {
        return;
    }

    for (idx = 0; idx < keys_reply->elements; idx ++) {
        redisReply *key_reply = keys_reply->element[idx];
        data_unit *du;

        if (key_reply->type != REDIS_REPLY_STRING) {
            return;
        }

        /* Build "<delete command> <key>" and hand it to the dispatcher. */
        du = data_unit_get();
        du->dp = delete_data_producer;
        du->argc = 2;
        du->argv = malloc(du->argc*sizeof(sds));
        du->argv[0] = sdsnew(delete_data_producer->name);
        du->argv[1] = sdsnewlen(key_reply->str,key_reply->len);
        data_dispatch(du);
    }

    /* Keep scanning from the cursor just received. */
    cc = darray_get(server->conn_contexts, 0);
    redisAsyncCommand(cc->actx, scan_for_delete_callback,
        server, "scan %lld count 1000", td->cursor);
}

/*
 * Reply handler for "info memory". Stores the reported used_memory in the
 * server's task_data and, while no maxmemory value is known (it is 0), also
 * stores total_system_memory.
 */
static void update_memory_callback(redisAsyncContext *c, void *r, void *privdata) {
    abtest_server *server = privdata;
    task_data *td = server->data;
    redisReply *info = r;

    if (info == NULL) {
        return;
    }

    td->used_memory = get_longlong_from_info_reply(info, "used_memory");

    if (td->maxmemory != 0) {
        return;
    }

    td->total_system_memory = get_longlong_from_info_reply(info, "total_system_memory");
}

/*
 * Reply handler for "config get maxmemory". Accepts only a two element
 * array whose first element is the string "maxmemory" and whose second
 * element is a string holding an integer; that integer is stored as the
 * server's maxmemory. Any other reply is ignored.
 */
static void update_maxmemory_callback(redisAsyncContext *c, void *r, void *privdata) {
    abtest_server *server = privdata;
    task_data *td = server->data;
    redisReply *reply = r;
    redisReply *name_reply, *value_reply;
    long long limit;

    if (reply == NULL) {
        return;
    }

    if (reply->type != REDIS_REPLY_ARRAY || reply->elements != 2) {
        return;
    }

    name_reply = reply->element[0];
    if (name_reply->type != REDIS_REPLY_STRING) {
        return;
    }
    if (strcmp(name_reply->str, "maxmemory") != 0) {
        return;
    }

    value_reply = reply->element[1];
    if (value_reply->type != REDIS_REPLY_STRING) {
        return;
    }
    if (string2ll(value_reply->str,value_reply->len,&limit) != 1) {
        return;
    }

    td->maxmemory = limit;
}

/*
 * Queue "info memory" and "config get maxmemory" on the first connection of
 * every server in every group; the replies are handled by
 * update_memory_callback() and update_maxmemory_callback().
 */
static void update_memory_info(darray *abgs)
{
    long long group_idx, server_idx;

    for (group_idx = 0; group_idx < darray_n(abgs); group_idx ++) {
        abtest_group *group = darray_get(abgs, group_idx);

        for (server_idx = 0; server_idx < darray_n(&group->abtest_servers); server_idx ++) {
            abtest_server *server = darray_get(&group->abtest_servers, server_idx);
            conn_context *conn = darray_get(server->conn_contexts, 0);

            redisAsyncCommand(conn->actx, update_memory_callback, server, "info memory");
            redisAsyncCommand(conn->actx, update_maxmemory_callback, server, "config get maxmemory");
        }
    }
}

/*
 * Switch servers in and out of deleting mode based on their memory usage.
 *
 * For each server with known usage, the limit is maxmemory if set,
 * otherwise total_system_memory. When usage exceeds 80% of the limit and
 * the server is not yet deleting, a scan is started and both the server's
 * and the thread's deleting counters are raised. When usage is at or below
 * 80% and the server is deleting, deleting mode is cleared again.
 */
static void check_memory_enough(backend_thread *bt)
{
    long long group_idx, server_idx;
    darray *groups = bt->abgs;

    for (group_idx = 0; group_idx < darray_n(groups); group_idx ++) {
        abtest_group *group = darray_get(groups, group_idx);

        for (server_idx = 0; server_idx < darray_n(&group->abtest_servers); server_idx ++) {
            abtest_server *server = darray_get(&group->abtest_servers, server_idx);
            task_data *td = server->data;
            long long limit = 0;

            /* Nothing to decide until the server reported its usage. */
            if (!td->used_memory) {
                continue;
            }

            if (td->maxmemory) {
                limit = td->maxmemory;
            } else if (td->total_system_memory) {
                limit = td->total_system_memory;
            }

            if (!limit) {
                continue;
            }

            if (td->used_memory*100/limit > 80) {
                conn_context *conn;

                if (td->deleting) {
                    continue;
                }

                conn = darray_get(server->conn_contexts, 0);
                redisAsyncCommand(conn->actx, scan_for_delete_callback,
                    server, "scan %lld count 1000", td->cursor);
                td->deleting = 1;
                bt->deleting ++;
            } else if (td->deleting) {
                td->deleting = 0;
                bt->deleting --;
            }
        }
    }
}

/*
 * Periodic timer callback of a backend thread.
 *
 * While paused, the thread only checks whether the pause is still required
 * and, if so, asks to be called again in 1000 ms. Otherwise it refreshes
 * the memory information of every server, adjusts deleting mode, and enters
 * the paused state when a pause is requested and no server is deleting.
 *
 * Returns the delay in milliseconds until the next invocation
 * (1000 while paused, 1000/hz otherwise).
 */
static int backend_thread_cron(aeEventLoop *eventLoop, long long id, void *clientData)
{
    backend_thread *bt = clientData;

    ASSERT(eventLoop == bt->el);

    /* At the begin of this loop */
    if (bt->pause) {
        if (test_if_need_pause()) {
            bt->cronloops ++;
            return 1000;
        }
        bt->pause = 0;
    }

    update_memory_info(bt->abgs);
    check_memory_enough(bt);

    /* At the end of this loop */
    if (!bt->pause) {
        if (test_if_need_pause() && !bt->deleting) {
            bt->pause = 1;
            one_backend_thread_paused();
        }
    }

    bt->cronloops ++;
    return 1000/bt->hz;
}

/*
 * Initialize a backend thread descriptor.
 *
 * Creates the event loop, parses 'test_target_groups' into groups, opens
 * one asynchronous connection per server (attached to the event loop, with
 * connect/disconnect callbacks installed), allocates the per-server
 * task_data and registers the periodic cron timer.
 *
 * Returns VRT_OK on success and VRT_ERROR on the first failure. On failure
 * the descriptor is left partially initialized; every pointer field is
 * either valid or NULL.
 *
 * NOTE(review): the event loop is created with a set size of 1, whereas
 * benchmark_thread_init() uses 1024*10. If the set size bounds the usable
 * file descriptor numbers, 1 is too small for the sockets attached below -
 * confirm against the ae implementation.
 */
static int backend_thread_init(backend_thread *bt, char *test_target_groups)
{
    int i, j;

    bt->id = 0;
    bt->thread_id = 0;
    bt->el = NULL;
    bt->hz = 10;
    bt->cronloops = 0;
    bt->abgs = NULL;    /* keep the field defined on early error returns */
    bt->deleting = 0;
    bt->pause = 0;

    bt->el = aeCreateEventLoop(1);
    if (bt->el == NULL) {
        return VRT_ERROR;
    }

    bt->abgs = abtest_groups_create(test_target_groups);
    if (bt->abgs == NULL) {
        return VRT_ERROR;
    }

    /* Init connection context for each server */
    for (i = 0; i < darray_n(bt->abgs); i ++) {
        abtest_group *abg = darray_get(bt->abgs, i);
        for (j = 0; j < darray_n(&abg->abtest_servers); j ++) {
            abtest_server *abs = darray_get(&abg->abtest_servers, j);
            conn_context *cc;

            abs->conn_contexts = darray_create(1, sizeof(conn_context));
            if (abs->conn_contexts == NULL) {
                return VRT_ERROR;
            }

            /* Exactly one connection per server. */
            cc = darray_push(abs->conn_contexts);
            if (cc == NULL) {
                return VRT_ERROR;
            }
            if (backend_conn_context_init(cc,abs->host,abs->port) != VRT_OK) {
                return VRT_ERROR;
            }
            cc->actx->data = bt;
            if (redisAeAttach(bt->el, cc->actx) != REDIS_OK) {
                return VRT_ERROR;
            }
            redisAsyncSetConnectCallback(cc->actx,connect_callback);
            redisAsyncSetDisconnectCallback(cc->actx,disconnect_callback);

            abs->data = task_data_create();
            if (abs->data == NULL) {
                return VRT_ERROR;
            }
        }
    }

    if (aeCreateTimeEvent(bt->el, 1, backend_thread_cron, bt, NULL) == AE_ERR) {
        return VRT_ERROR;
    }

    return VRT_OK;
}

/*
 * Release everything a backend thread descriptor owns.
 *
 * The server connections are closed first, while the event loop they are
 * attached to still exists, because releasing an attached hiredis async
 * context may unregister its file events from that loop. The event loop is
 * deleted last.
 */
static void backend_thread_deinit(backend_thread *bt)
{
    if (bt->abgs) {
        int i, j;
        /* Deinit connection context for each server */
        for (i = 0; i < darray_n(bt->abgs); i ++) {
            abtest_group *abg = darray_get(bt->abgs, i);
            for (j = 0; j < darray_n(&abg->abtest_servers); j ++) {
                abtest_server *abs = darray_get(&abg->abtest_servers, j);

                /* conn_contexts is NULL if initialization stopped before
                 * reaching this server. */
                if (abs->conn_contexts) {
                    while (darray_n(abs->conn_contexts) > 0) {
                        conn_context *cc = darray_pop(abs->conn_contexts);
                        backend_conn_context_deinit(cc);
                    }
                }

                if (abs->data) {
                    task_data_destroy(abs->data);
                    abs->data = NULL;   /* was a bare 'abs->data;' no-op */
                }
            }
        }

        abtest_groups_destroy(bt->abgs);
        bt->abgs = NULL;
    }

    if (bt->el) {
        aeDeleteEventLoop(bt->el);
        bt->el = NULL;
    }
}

int vrt_backend_init(int threads_count, char *test_target_groups)
{
    int j;
    
    backend_threads_count = threads_count;
    backend_threads = darray_create(threads_count, sizeof(backend_thread));
    if (backend_threads == NULL) {
        return VRT_ERROR;
    }

    for (j = 0; j < threads_count; j ++) {
        backend_thread *bt = darray_push(backend_threads);
        if (backend_thread_init(bt, test_target_groups) != VRT_OK) {
            return VRT_ERROR;
        }
        bt->id = j;
    }
    
    return VRT_OK;
}

/* Deinitialize every backend thread descriptor and release the array that
 * holds them. Does nothing if the array was never created. */
void vrt_backend_deinit(void)
{
    if (backend_threads == NULL) {
        return;
    }

    for (; darray_n(backend_threads) > 0; ) {
        backend_thread *thread = darray_pop(backend_threads);
        backend_thread_deinit(thread);
    }

    darray_destroy(backend_threads);
    backend_threads = NULL;
}

/* Thread entry point: seeds rand() from the current time and the thread id,
 * then runs the backend thread's event loop until it stops. */
static void *vrt_backend_thread_run(void *args)
{
    backend_thread *thread = args;
    unsigned int seed = vrt_usec_now()^(int)pthread_self();

    srand(seed);
    aeMain(thread->el);

    return NULL;
}

int vrt_start_backend(void)
{
    unsigned int i;
    for (i = 0; i < darray_n(backend_threads); i ++) {
        pthread_attr_t attr;
        backend_thread *bt;
        pthread_attr_init(&attr);
        bt = darray_get(backend_threads, i);
        pthread_create(&bt->thread_id, 
            &attr, vrt_backend_thread_run, bt);
    }
    
    return VRT_OK;
}

/* Block until every backend thread has finished. Always returns VRT_OK. */
int vrt_wait_backend(void)
{
    unsigned int idx = 0;

    /* wait for the backend threads finish */
    while (idx < darray_n(backend_threads)) {
        backend_thread *thread = darray_get(backend_threads, idx);
        pthread_join(thread->thread_id, NULL);
        idx ++;
    }

    return VRT_OK;
}


================================================
FILE: tests/vrt_backend.h
================================================
#ifndef _VRT_BACKEND_H_
#define _VRT_BACKEND_H_

#include <darray.h>

struct abtest_group;
struct dlist;
struct dmtlist;
struct data_unit;
struct aeEventLoop;

/* State of one backend thread: its event loop, the test target groups it
 * monitors and its pause/deleting status. */
typedef struct backend_thread {
    int id;                 /* index assigned by vrt_backend_init() */
    pthread_t thread_id;    /* filled in by pthread_create() */
    
    struct aeEventLoop *el; /* event loop run by the thread */
    int hz;                 /* cron frequency; the cron asks to run again after 1000/hz ms */
    int cronloops;          /* Number of times the cron function run */

    darray *abgs; /* type is abtest_group */

    int deleting;           /* number of servers currently in deleting mode */
    int pause;              /* non-zero while the thread is paused */
} backend_thread;

extern int backend_threads_count;

extern int backend_threads_pause_finished_count;

int vrt_backend_init(int threads_count, char *test_target_groups);
void vrt_backend_deinit(void);

int vrt_start_backend(void);
int vrt_wait_backend(void);

#endif


================================================
FILE: tests/vrt_benchmark.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <getopt.h>
#include <fcntl.h>
#include <errno.h>
#include <signal.h>
#include <assert.h>
#include <sys/stat.h>
#include <sys/utsname.h>

#include <ae.h>

#include <hiredis.h>
#include <sds.h>

#include <darray.h>
#include <dlist.h>
#include <dutil.h>
#include <dlog.h>

#include <vrt_util.h>
#include <vrt_public.h>
#include <himemcached.h>

#define TEST_CMD_PROTOCOL_REDIS     0
#define TEST_CMD_PROTOCOL_MEMCACHE  1

#define RANDPTR_INITIAL_SIZE 8

/*
 * Global settings and counters of the benchmark tool.
 *
 * Only some fields are used in the nearby code: 'pipeline' is the value a
 * client's pending counter is reset to, 'keepalive' selects whether a
 * finished client is reset or replaced, 'randomkeys_keyspacelen' and
 * 'randomfields_fieldspacelen' are the moduli applied to random key and
 * field numbers, 'showerrors' enables printing of server error replies and
 * 'threads_count' is the number of benchmark threads started.
 * NOTE(review): the remaining fields are presumably filled from the command
 * line - confirm against the option parser.
 */
static struct config {
    const char *hostip;
    int hostport;
    const char *hostsocket;
    int numclients;
    int liveclients;
    int requests;
    int requests_issued;
    int requests_finished;
    int keysize;
    int datasize;
    int randomkeys;
    int randomkeys_keyspacelen;
    int randomfields;
    int randomfields_fieldspacelen;
    int keepalive;
    int pipeline;
    int showerrors;
    long long start;
    long long totlatency;
    long long *latency;
    const char *title;
    int quiet;
    int csv;
    int loop;
    int idlemode;
    int dbnum;
    sds dbnumstr;
    char *tests;
    char *types;
    char *auth;
    int threads_count;
    int protocol;
    int noinline;
} config;

/* State of one benchmark thread: its event loop, its clients and its share
 * of the request counters and latency samples. */
typedef struct benchmark_thread {
    int id;                 /* thread with id 0 installs the throughput timer */
    pthread_t thread_id;    /* filled in by pthread_create() */
    
    struct aeEventLoop *el; /* event loop run by the thread */
    int hz;
    int cronloops;          /* Number of times the cron function run */

    dlist *clients;         /* list of benchmark_client owned by this thread */
    int numclients;
    int liveclients;        /* adjusted through update_state_add/sub */

    int requests;           /* the event loop stops once requests_finished equals this */
    int requests_issued;
    int requests_finished;

    long long start;
    long long totlatency;
    long long *latency;     /* array of 'requests' entries */
} benchmark_thread;

/* One benchmark connection. Note that 'benchmark_client' is a pointer
 * typedef: variables of this type are pointers to the struct. */
typedef struct _benchmark_client {
    benchmark_thread *bt;   /* Thread that owns this client */
    
    redisContext *rc;       /* hiredis context; its fd is registered with the event loop */
    mcContext *mc;          /* memcached context; may be NULL */
    sds obuf;               /* Output buffer holding the commands to send */
    char **randkeyptr;      /* Pointers to :randkey: strings inside the command buf */
    size_t randkeylen;      /* Number of pointers in client->randkeyptr */
    size_t randkeyfree;     /* Number of unused pointers in client->randkeyptr */
    char **randfieldptr;    /* Pointers to :randfield: strings inside the command buf */
    size_t randfieldlen;    /* Number of pointers in client->randfieldptr */
    size_t randfieldfree;   /* Number of unused pointers in client->randfieldptr */
    size_t written;         /* Bytes of 'obuf' already written */
    long long start;        /* Start time of a request */
    long long latency;      /* Request latency */
    int pending;            /* Number of pending requests (replies to consume) */
    int prefix_pending;     /* If non-zero, number of pending prefix commands. Commands
                               such as auth and select are prefixed to the pipeline of
                               benchmark commands and discarded after the first send. */
    int prefixlen;          /* Size in bytes of the pending prefix commands */
} *benchmark_client;

static darray *bts; /* Benchmark threads */

/* Prototypes */
static void writeHandler(aeEventLoop *el, int fd, void *privdata, int mask);
static benchmark_client createClient(char *cmd, size_t len, benchmark_client from, benchmark_thread *thread);
static void createMissingClients(benchmark_client c);
static int showThroughput(struct aeEventLoop *eventLoop, long long id, void *clientData);

/*
 * Destroy a benchmark client: unregister its file events, release its
 * connection contexts and buffers, unlink it from its thread's client list
 * and decrement the thread's live client counter.
 *
 * The client is removed from the list before its memory is freed, so the
 * list lookup never uses the value of an already freed pointer.
 */
static void freeClient(benchmark_client c) {
    benchmark_thread *bt = c->bt;
    dlistNode *ln;

    if (bt->el) {
        aeDeleteFileEvent(bt->el,c->rc->fd,AE_WRITABLE);
        aeDeleteFileEvent(bt->el,c->rc->fd,AE_READABLE);
    }
    redisFree(c->rc);
    if (c->mc) {
        /* Detach the fd before freeing the memcached context; the hiredis
         * context was already released just above. */
        c->mc->fd = -1;
        memcachedFree(c->mc);
    }
    sdsfree(c->obuf);
    free(c->randkeyptr);
    free(c->randfieldptr);

    ln = dlistSearchKey(bt->clients,c);
    ASSERT(ln != NULL);
    dlistDelNode(bt->clients,ln);

    free(c);
    update_state_sub(bt->liveclients,1);
}

/* Free every client stored in 'clients'. The successor is saved before each
 * call because freeClient() removes the current node from the list. */
static void freeAllClients(dlist *clients) {
    dlistNode *node, *following;

    for (node = clients->head; node; node = following) {
        following = node->next;
        freeClient(node->value);
    }
}

/* Prepare a client for its next round: drop both file events, register the
 * write handler again and reset the write offset and pending counter. */
static void resetClient(benchmark_client c) {
    struct aeEventLoop *loop = c->bt->el;
    int fd = c->rc->fd;

    aeDeleteFileEvent(loop,fd,AE_WRITABLE);
    aeDeleteFileEvent(loop,fd,AE_READABLE);
    aeCreateFileEvent(loop,fd,AE_WRITABLE,writeHandler,c);

    c->pending = config.pipeline;
    c->written = 0;
}

/* Overwrite each registered random-key slot with a fresh random number
 * below config.randomkeys_keyspacelen, written as 12 zero-padded decimal
 * digits. */
static void randomizeClientKey(benchmark_client c) {
    size_t slot;

    for (slot = 0; slot < c->randkeylen; slot++) {
        char *digits = c->randkeyptr[slot];
        size_t r = random() % config.randomkeys_keyspacelen;
        int pos;

        /* Fill from the least significant digit (last position) backwards. */
        for (pos = 11; pos >= 0; pos--) {
            digits[pos] = '0'+r%10;
            r/=10;
        }
    }
}

/* Overwrite each registered random-field slot with a fresh random number
 * below config.randomfields_fieldspacelen, written as 14 zero-padded
 * decimal digits. */
static void randomizeClientField(benchmark_client c) {
    size_t slot;

    for (slot = 0; slot < c->randfieldlen; slot++) {
        char *digits = c->randfieldptr[slot];
        size_t r = random() % config.randomfields_fieldspacelen;
        int pos;

        /* Fill from the least significant digit (last position) backwards. */
        for (pos = 13; pos >= 0; pos--) {
            digits[pos] = '0'+r%10;
            r/=10;
        }
    }
}


/*
 * Called when a client has consumed all replies of its current round.
 *
 * If the thread reached its request target, the client is freed and the
 * event loop is stopped. Otherwise the client is either reset for another
 * round (keepalive) or replaced by a new client and freed.
 */
static void clientDone(benchmark_client c) {
    benchmark_thread *bt = c->bt;
    int finished;

    update_state_get(bt->requests_finished,&finished);
    if (finished == bt->requests) {
        freeClient(c);
        aeStop(bt->el);
        return;
    }

    if (!config.keepalive) {
        /* Temporarily lower the live count so createMissingClients()
         * creates the replacement, then restore it before freeClient()
         * performs its own decrement. */
        update_state_sub(bt->liveclients,1);
        createMissingClients(c);
        update_state_add(bt->liveclients,1);
        freeClient(c);
        return;
    }

    resetClient(c);
}

/*
 * Initialize a benchmark thread descriptor.
 *
 * bt:         descriptor to fill. bt->id is not assigned here, yet it is
 *             read below to decide which thread installs the throughput
 *             timer, so the caller must set it beforehand.
 * requests:   number of requests this thread has to complete.
 * numclients: number of clients this thread should run.
 * cmd, len:   command buffer handed to createClient() for the first client.
 *
 * Returns VRT_OK on success; VRT_ERROR if the event loop, the client list,
 * the latency array or the first client cannot be created.
 */
static int benchmark_thread_init(benchmark_thread *bt, int requests, int numclients, char *cmd, size_t len)
{
    benchmark_client c;

    bt->thread_id = 0;
    bt->el = NULL;
    bt->hz = 10;
    bt->cronloops = 0;
    bt->clients = NULL;
    bt->numclients = numclients;
    bt->liveclients = 0;
    bt->requests = requests;
    bt->requests_issued = 0;
    bt->requests_finished = 0;
    bt->start = 0;
    bt->totlatency = 0;
    bt->latency = NULL;

    bt->el = aeCreateEventLoop(1024*10);
    if (bt->el == NULL) {
        return VRT_ERROR;
    }

    bt->clients = dlistCreate();
    if (bt->clients == NULL) {
        return VRT_ERROR;
    }

    bt->latency = malloc(sizeof(long long)*bt->requests);
    /* malloc(0) may legitimately return NULL, so only a non-empty request
     * count turns a NULL result into an error. */
    if (bt->latency == NULL && bt->requests > 0) {
        return VRT_ERROR;
    }

    /* The first client serves as the template for the remaining ones. */
    c = createClient(cmd,len,NULL,bt);
    if (c == NULL) {
        return VRT_ERROR;
    }
    createMissingClients(c);

    if (bt->id == 0) {
        aeCreateTimeEvent(bt->el,1,showThroughput,NULL,NULL);
    }

    return VRT_OK;
}

/* Release a benchmark thread descriptor: first its clients and the list
 * that holds them, then the event loop, then the latency array. */
static void benchmark_thread_deinit(benchmark_thread *bt)
{
    if (bt->clients != NULL) {
        freeAllClients(bt->clients);
        dlistRelease(bt->clients);
        bt->clients = NULL;
    }

    if (bt->el != NULL) {
        aeDeleteEventLoop(bt->el);
        bt->el = NULL;
    }

    if (bt->latency != NULL) {
        free(bt->latency);
        bt->latency = NULL;
    }
}

/* Thread entry point: seeds rand() from the current time and the thread id,
 * then runs the benchmark thread's event loop until it stops. */
static void *benchmark_thread_run(void *args)
{
    benchmark_thread *thread = args;
    unsigned int seed = vrt_usec_now()^(int)pthread_self();

    srand(seed);
    aeMain(thread->el);

    return NULL;
}

static int start_benchmark_threads_until_finish(void)
{
    int i;
    benchmark_thread *bt;
    
    for (i = 0; i < config.threads_count; i ++) {
        pthread_attr_t attr;
        pthread_attr_init(&attr);
        bt = darray_get(bts, i);
        pthread_create(&bt->thread_id, 
            &attr, benchmark_thread_run, bt);
    }

    for (i = 0; i < config.threads_count; i ++) {
        bt = darray_get(bts, i);
        pthread_join(bt->thread_id, NULL);
    }
    
    return VRT_OK;
}

/* Readable-event handler used with the memcached protocol. 'privdata' is
 * the benchmark client owning the connection.
 *
 * Reads what the server sent and consumes as many replies as are available,
 * up to the number the client is still waiting for. Replies to prefix
 * commands are only counted; each other reply is recorded in the thread's
 * latency array. clientDone() is called once no reply is pending anymore.
 * Any read or protocol error terminates the process. */
static void readHandlerMC(aeEventLoop *el, int fd, void *privdata, int mask) {
    benchmark_client client = privdata;
    benchmark_thread *bt = client->bt;
    mcContext *ctx = client->mc;
    int finished;
    void *reply = NULL;
    UNUSED(el);
    UNUSED(fd);
    UNUSED(mask);

    /* The latency is measured on the first read event only: the reply has
     * already been sent by the server at this point, and the time spent
     * parsing it must not be accounted for. */
    if (client->latency < 0) client->latency = dusec_now()-(client->start);

    if (memcachedBufferRead(ctx) != MC_OK) {
        fprintf(stderr,"Error: %s\n",ctx->errstr);
        exit(1);
    }

    while (client->pending) {
        if (memcachedGetReply(ctx,&reply) != MC_OK) {
            fprintf(stderr,"Error: %s\n",ctx->errstr);
            exit(1);
        }

        /* No reply was produced from the buffered data: stop here. */
        if (reply == NULL) break;

        if (reply == (void*)MC_REPLY_ERROR) {
            fprintf(stderr,"Unexpected error reply, exiting...\n");
            exit(1);
        }

        if (config.showerrors) {
            /* Report at most one server error per second. */
            static time_t lasterr_time = 0;
            time_t now = time(NULL);
            mcReply *r = reply;
            if (r->type == MC_REPLY_ERROR && lasterr_time != now) {
                lasterr_time = now;
                printf("Error from server: %s\n", r->str);
            }
        }

        freeMcReplyObject(reply);

        /* Reply to a prefix command (such as auth or select). */
        if (client->prefix_pending > 0) {
            client->prefix_pending--;
            client->pending--;
            /* The first such reply drops the prefix from the buffer. */
            if (client->prefixlen > 0) {
                size_t k;
                sdsrange(client->obuf, client->prefixlen, -1);
                /* The pointers to the strings to randomize have to be
                 * shifted back by the length of the removed prefix. */
                for (k = 0; k < client->randkeylen; k++)
                    client->randkeyptr[k] -= client->prefixlen;
                for (k = 0; k < client->randfieldlen; k++)
                    client->randfieldptr[k] -= client->prefixlen;
                client->prefixlen = 0;
            }
            continue;
        }

        /* Store the sample only while there is room left for it. */
        update_state_get(bt->requests_finished,&finished);
        if (finished < bt->requests) {
            bt->latency[finished] = client->latency;
            update_state_add(bt->requests_finished,1);
        }

        client->pending--;
        if (client->pending == 0) {
            clientDone(client);
            break;
        }
    }
}

/* Readable-event handler used with the redis protocol. 'privdata' is the
 * benchmark client owning the connection.
 *
 * Reads what the server sent and consumes as many replies as are available,
 * up to the number the client is still waiting for. Replies to prefix
 * commands are only counted; each other reply is recorded in the thread's
 * latency array. clientDone() is called once no reply is pending anymore.
 * Any read or protocol error terminates the process. */
static void readHandler(aeEventLoop *el, int fd, void *privdata, int mask) {
    benchmark_client client = privdata;
    benchmark_thread *bt = client->bt;
    int finished;
    void *reply = NULL;
    UNUSED(el);
    UNUSED(fd);
    UNUSED(mask);

    /* The latency is measured on the first read event only: the reply has
     * already been sent by the server at this point, and the time spent
     * parsing it must not be accounted for. */
    if (client->latency < 0) client->latency = dusec_now()-(client->start);

    if (redisBufferRead(client->rc) != REDIS_OK) {
        fprintf(stderr,"Error: %s\n",client->rc->errstr);
        exit(1);
    }

    while (client->pending) {
        if (redisGetReply(client->rc,&reply) != REDIS_OK) {
            fprintf(stderr,"Error: %s\n",client->rc->errstr);
            exit(1);
        }

        /* No reply was produced from the buffered data: stop here. */
        if (reply == NULL) break;

        if (reply == (void*)REDIS_REPLY_ERROR) {
            fprintf(stderr,"Unexpected error reply, exiting...\n");
            exit(1);
        }

        if (config.showerrors) {
            /* Report at most one server error per second. */
            static time_t lasterr_time = 0;
            time_t now = time(NULL);
            redisReply *r = reply;
            if (r->type == REDIS_REPLY_ERROR && lasterr_time != now) {
                lasterr_time = now;
                printf("Error from server: %s\n", r->str);
            }
        }

        freeReplyObject(reply);

        /* Reply to a prefix command (such as auth or select). */
        if (client->prefix_pending > 0) {
            client->prefix_pending--;
            client->pending--;
            /* The first such reply drops the prefix from the buffer. */
            if (client->prefixlen > 0) {
                size_t k;
                sdsrange(client->obuf, client->prefixlen, -1);
                /* The pointers to the strings to randomize have to be
                 * shifted back by the length of the removed prefix. */
                for (k = 0; k < client->randkeylen; k++)
                    client->randkeyptr[k] -= client->prefixlen;
                for (k = 0; k < client->randfieldlen; k++)
                    client->randfieldptr[k] -= client->prefixlen;
                client->prefixlen = 0;
            }
            continue;
        }

        /* Store the sample only while there is room left for it. */
        update_state_get(bt->requests_finished,&finished);
        if (finished < bt->requests) {
            bt->latency[finished] = client->latency;
            update_state_add(bt->requests_finished,1);
        }

        client->pending--;
        if (client->pending == 0) {
            clientDone(client);
            break;
        }
    }
}

/* Writable-event handler. 'privdata' is the benchmark client owning the
 * connection.
 *
 * When nothing of the current request was written yet, the request is first
 * set up: the client is freed if the thread already issued all its requests,
 * otherwise keys/fields are randomized when configured and the start time is
 * taken. The unsent part of the output buffer is then written to the socket.
 * Once the whole buffer is sent, the writable event is replaced by the
 * readable handler matching the configured protocol. A write error frees
 * the client. */
static void writeHandler(aeEventLoop *el, int fd, void *privdata, int mask) {
    benchmark_client client = privdata;
    benchmark_thread *bt = client->bt;
    ssize_t sent;
    UNUSED(el);
    UNUSED(fd);
    UNUSED(mask);

    if (client->written == 0) {
        /* Never issue more requests than this thread was asked for. */
        if (bt->requests_issued++ >= bt->requests) {
            freeClient(client);
            return;
        }

        /* A new request starts here: randomize and take the start time. */
        if (config.randomkeys) randomizeClientKey(client);
        if (config.randomfields) randomizeClientField(client);
        client->start = dusec_now();
        client->latency = -1;
    }

    /* Nothing left to send. */
    if (sdslen(client->obuf) <= client->written) return;

    sent = write(client->rc->fd,client->obuf+client->written,
        sdslen(client->obuf)-client->written);
    if (sent == -1) {
        if (errno != EPIPE)
            fprintf(stderr, "Writing to socket: %s\n", strerror(errno));
        freeClient(client);
        return;
    }

    client->written += sent;

    /* Partial write: wait for the next writable event. */
    if (sdslen(client->obuf) != client->written) return;

    /* Everything was sent: from now on wait for the replies. */
    aeDeleteFileEvent(bt->el,client->rc->fd,AE_WRITABLE);
    if (config.protocol == TEST_CMD_PROTOCOL_REDIS) {
        aeCreateFileEvent(bt->el,client->rc->fd,AE_READABLE,readHandler,client);
    } else if (config.protocol == TEST_CMD_PROTOCOL_MEMCACHE) {
        aeCreateFileEvent(bt->el,client->rc->fd,AE_READABLE,readHandlerMC,client);
    } else {
        NOT_REACHED();
    }
}

/* Create a benchmark client, configured to send the command passed as 'cmd' of
 * 'len' bytes.
 *
 * The command is copied N times in the client output buffer (that is reused
 * again and again to send the request to the server) accordingly to the configured
 * pipeline size.
 *
 * Also an initial AUTH and/or SELECT command is prepended when a password or
 * a non-zero database number is configured. These prefix commands are
 * discarded as soon as their replies are received.
 *
 * To create a client from scratch, the 'from' pointer is set to NULL and
 * 'thread' must point to the benchmark thread that will own the client. If
 * instead we want to create a client using another client as reference, the
 * 'from' pointer points to the client to use as reference ('cmd', 'len' and
 * 'thread' are then not used). In such a case the following information is
 * taken from the 'from' client:
 *
 * 1) The command line to use.
 * 2) The offsets of the __rand_key__ and __rand_field__ elements inside the
 *    command line, used for arguments randomization.
 * 3) The owning benchmark thread.
 *
 * Even when cloning another client, prefix commands are applied if needed.
 *
 * The new client is appended to the thread's client list and the thread's
 * live clients counter is incremented. The process exits with status 1 if
 * the client or its connection context cannot be allocated, or if the
 * connection fails. Returns the new client. */
static benchmark_client createClient(char *cmd, size_t len, benchmark_client from, benchmark_thread *thread) {
    int j;
    benchmark_thread *bt;
    benchmark_client c = malloc(sizeof(struct _benchmark_client));

    if (c == NULL) {
        fprintf(stderr,"Could not allocate memory for a benchmark client\n");
        exit(1);
    }

    c->bt = NULL;
    c->rc = NULL;
    c->mc = NULL;
    c->obuf = NULL;
    c->randkeyptr = NULL;
    c->randkeylen = 0;
    c->randkeyfree = 0;
    c->randfieldptr = NULL;
    c->randfieldlen = 0;
    c->randfieldfree = 0;
    c->written = 0;
    c->start = 0;
    c->latency = 0;
    c->pending = 0;
    c->prefix_pending = 0;
    c->prefixlen = 0;
    
    if (from == NULL) {
        ASSERT(thread != NULL);
        bt = thread;
    } else {
        bt = from->bt;
    }

    c->bt = bt;

    if (config.hostsocket == NULL) {
        c->rc = redisConnectNonBlock(config.hostip,config.hostport);
    } else {
        c->rc = redisConnectUnixNonBlock(config.hostsocket);
    }
    /* The connect functions return NULL when the context itself cannot be
     * allocated, so the pointer is checked before looking at its fields. */
    if (c->rc == NULL) {
        fprintf(stderr,"Could not connect to Redis: can't allocate redis context\n");
        exit(1);
    }
    if (c->rc->err) {
        fprintf(stderr,"Could not connect to Redis at ");
        if (config.hostsocket == NULL)
            fprintf(stderr,"%s:%d: %s\n",config.hostip,config.hostport,c->rc->errstr);
        else
            fprintf(stderr,"%s: %s\n",config.hostsocket,c->rc->errstr);
        exit(1);
    }
    /* Suppress hiredis cleanup of unused buffers for max speed. */
    c->rc->reader->maxbuf = 0;

    /* Build the request buffer:
     * Queue N requests accordingly to the pipeline size, or simply clone
     * the example client buffer. */
    c->obuf = sdsempty();
    /* Prefix the request buffer with AUTH and/or SELECT commands, if applicable.
     * These commands are discarded after the first response, so if the client is
     * reused the commands will not be used again. */
    c->prefix_pending = 0;
    if (config.auth) {
        char *buf = NULL;
        int authlen = redisFormatCommand(&buf, "AUTH %s", config.auth);
        c->obuf = sdscatlen(c->obuf, buf, authlen);
        free(buf);
        c->prefix_pending++;
    }

    /* If a DB number different than zero is selected, prefix our request
     * buffer with the SELECT command, that will be discarded the first
     * time the replies are received, so if the client is reused the
     * SELECT command will not be used again. */
    if (config.dbnum != 0) {
        c->obuf = sdscatprintf(c->obuf,"*2\r\n$6\r\nSELECT\r\n$%d\r\n%s\r\n",
            (int)sdslen(config.dbnumstr),config.dbnumstr);
        c->prefix_pending++;
    }
    c->prefixlen = sdslen(c->obuf);
    /* Append the request itself. */
    if (from) {
        c->obuf = sdscatlen(c->obuf,
            from->obuf+from->prefixlen,
            sdslen(from->obuf)-from->prefixlen);
    } else {
        for (j = 0; j < config.pipeline; j++)
            c->obuf = sdscatlen(c->obuf,cmd,len);
    }

    c->written = 0;
    /* One reply is expected per pipelined request and per prefix command. */
    c->pending = config.pipeline+c->prefix_pending;
    c->randkeyptr = NULL;
    c->randkeylen = 0;
    c->randfieldptr = NULL;
    c->randfieldlen = 0;

    /* Find substrings in the output buffer that need to be randomized. */
    if (config.randomkeys) {
        if (from) {
            c->randkeylen = from->randkeylen;
            c->randkeyfree = 0;
            c->randkeyptr = malloc(sizeof(char*)*c->randkeylen);
            /* copy the offsets. */
            for (j = 0; j < (int)c->randkeylen; j++) {
                c->randkeyptr[j] = c->obuf + (from->randkeyptr[j]-from->obuf);
                /* Adjust for the different select prefix length. */
                c->randkeyptr[j] += c->prefixlen - from->prefixlen;
            }
        } else {
            char *p = c->obuf;

            c->randkeylen = 0;
            c->randkeyfree = RANDPTR_INITIAL_SIZE;
            c->randkeyptr = malloc(sizeof(char*)*c->randkeyfree);
            while ((p = strstr(p,"__rand_key__")) != NULL) {
                /* Double the array when no free slot is left. */
                if (c->randkeyfree == 0) {
                    c->randkeyptr = realloc(c->randkeyptr,sizeof(char*)*c->randkeylen*2);
                    c->randkeyfree += c->randkeylen;
                }
                c->randkeyptr[c->randkeylen++] = p;
                c->randkeyfree--;
                p += 12; /* 12 is strlen("__rand_key__"). */
            }
        }
    }
    if (config.randomfields) {
        if (from) {
            c->randfieldlen = from->randfieldlen;
            c->randfieldfree = 0;
            c->randfieldptr = malloc(sizeof(char*)*c->randfieldlen);
            /* copy the offsets. */
            for (j = 0; j < (int)c->randfieldlen; j++) {
                c->randfieldptr[j] = c->obuf + (from->randfieldptr[j]-from->obuf);
                /* Adjust for the different select prefix length. */
                c->randfieldptr[j] += c->prefixlen - from->prefixlen;
            }
        } else {
            char *p = c->obuf;

            c->randfieldlen = 0;
            c->randfieldfree = RANDPTR_INITIAL_SIZE;
            c->randfieldptr = malloc(sizeof(char*)*c->randfieldfree);
            while ((p = strstr(p,"__rand_field__")) != NULL) {
                /* Double the array when no free slot is left. */
                if (c->randfieldfree == 0) {
                    c->randfieldptr = realloc(c->randfieldptr,sizeof(char*)*c->randfieldlen*2);
                    c->randfieldfree += c->randfieldlen;
                }
                c->randfieldptr[c->randfieldlen++] = p;
                c->randfieldfree--;
                p += 14; /* 14 is strlen("__rand_field__"). */
            }
        }
    }
    /* In idle mode the connection is only opened, nothing is ever sent. */
    if (config.idlemode == 0)
        aeCreateFileEvent(bt->el,c->rc->fd,AE_WRITABLE,writeHandler,c);

    /* Attach the redis fd to memcached fd */
    if (config.protocol == TEST_CMD_PROTOCOL_MEMCACHE) {
        c->mc = memcachedContextInit();
        c->mc->fd = c->rc->fd;
        c->mc->flags &= ~MC_BLOCK;
    }
    
    dlistAddNodeTail(bt->clients,c);
    update_state_add(bt->liveclients,1);

    return c;
}

/* Clone the client 'c' until the thread owning it has as many live clients
 * as its configured 'numclients'. After each run of 65 new clients the
 * function sleeps for 50 milliseconds. */
static void createMissingClients(benchmark_client c) {
    benchmark_thread *bt = c->bt;
    int alive;
    int burst = 0;

    for (;;) {
        update_state_get(bt->liveclients,&alive);
        if (alive >= bt->numclients) break;

        createClient(NULL,0,c,NULL);

        /* Listen backlog is quite limited on most systems */
        if (++burst > 64) {
            usleep(50000);
            burst = 0;
        }
    }
}

/* qsort() comparator for arrays of 'long long' latency samples, sorting in
 * ascending order. Returns a negative value, zero or a positive value when
 * the sample pointed to by 'a' is respectively lower than, equal to or
 * greater than the one pointed to by 'b'.
 *
 * The two values are compared rather than subtracted: a 'long long'
 * difference converted to 'int' can change sign or collapse to zero. */
static int compareLatency(const void *a, const void *b) {
    long long lhs = *(const long long*)a;
    long long rhs = *(const long long*)b;

    return (lhs > rhs) - (lhs < rhs);
}

/* Recompute config.liveclients and config.requests_finished as the sums of
 * the corresponding counters of every benchmark thread in 'bts'. */
static void updateBenchmarkStats(void)
{
    int idx = 0;
    int value;

    config.liveclients = 0;
    config.requests_finished = 0;

    while (idx < config.threads_count) {
        benchmark_thread *bt = darray_get(bts, idx);

        update_state_get(bt->liveclients,&value);
        config.liveclients += value;

        update_state_get(bt->requests_finished,&value);
        config.requests_finished += value;

        idx++;
    }
}

/* Print the result of the benchmark that just ended.
 *
 * With the csv option a single CSV line (title, requests per second) is
 * printed; otherwise in quiet mode a single summary line is printed. In the
 * remaining case the full report is produced: the latency samples of all the
 * threads are gathered into config.latency, sorted, and the cumulative
 * percentage of requests served within each millisecond step is printed. */
static void showLatencyReport(void) {
    int t, s, pos;
    int filled = 0;
    int curlat = 0;
    float perc, reqpersec;

    updateBenchmarkStats();

    reqpersec = (float)config.requests_finished/((float)config.totlatency/1000);

    if (config.csv) {
        printf("\"%s\",\"%.2f\"\n", config.title, reqpersec);
        return;
    }

    if (config.quiet) {
        printf("%s: %.2f requests per second\n", config.title, reqpersec);
        return;
    }

    printf("====== %s ======\n", config.title);
    printf("  %d requests completed in %.2f seconds\n", config.requests_finished,
        (float)config.totlatency/1000);
    printf("  %d parallel clients\n", config.numclients);
    printf("  %d bytes payload\n", config.datasize);
    printf("  keep alive: %d\n", config.keepalive);
    printf("\n");

    /* Gather the samples of every thread into a single array. */
    for (t = 0; t < config.threads_count; t++) {
        benchmark_thread *bt = darray_get(bts, t);
        for (s = 0; s < bt->requests; s ++) {
            config.latency[filled] = bt->latency[s];
            filled++;
        }
    }

    qsort(config.latency,config.requests,sizeof(long long),compareLatency);

    /* Print a line each time the latency in milliseconds changes, and for
     * the last sample. */
    for (pos = 0; pos < config.requests; pos++) {
        if (config.latency[pos]/1000 == curlat && pos != (config.requests-1))
            continue;
        curlat = config.latency[pos]/1000;
        perc = ((float)(pos+1)*100)/config.requests;
        printf("%.2f%% <= %d milliseconds\n", perc, curlat);
    }
    printf("%.2f requests per second\n\n", reqpersec);
}

static void benchmark(char *title, char *cmd, int len) {
    int i;
    int requests_per_thread, requests_remainder;
    int clients_per_thread, clients_remainder;
    benchmark_client c;

    config.title = title;
    config.requests_issued = 0;
    config.requests_finished = 0;
    
    requests_per_thread = config.requests/config.threads_count;
    requests_remainder = config.requests%config.threads_count;
    clients_per_thread = config.numclients/config.threads_count;
    clients_remainder = config.numclients%config.threads_count;

    bts = darray_create(config.threads_count, sizeof(benchmark_thread));
    for (i = 0; i < config.threads_count; i ++) {
        benchmark_thread *bt = darray_push(bts);
        bt->id = i;
        benchmark_thread_init(bt,
            requests_remainder-->0?requests_per_thread+1:requests_per_thread,
            clients_remainder-->0?clients_per_thread+1:clients_per_thread,
            cmd,len);
    }

    config.start = dmsec_now();
    start_benchmark_threads_until_finish();
    config.totlatency = dmsec_now()-config.start;

    showLatencyReport();

    while (darray_n(bts) > 0) {
        benchmark_thread *bt = darray_pop(bts);
        benchmark_thread_deinit(bt);
    }
    darray_destroy(bts);
    bts = NULL;
}

/* Parse the command line options in 'argv' (of 'argc' elements, argv[0]
 * being skipped) and store them into the global 'config'.
 *
 * Parsing stops at the first argument that does not start with a dash: the
 * remaining arguments are the command to benchmark. Returns the index of
 * that argument, or 'argc' when every argument was consumed as an option.
 *
 * An unknown option, or an option missing its argument, prints an error
 * followed by the usage text and exits with status 1. '--help' prints the
 * usage text and exits with status 0. */
int parseOptions(int argc, const char **argv) {
    int i;
    int lastarg;
    int exit_status = 1;

    for (i = 1; i < argc; i++) {
        lastarg = (i == (argc-1));

        if (!strcmp(argv[i],"-c")) {
            if (lastarg) goto invalid;
            config.numclients = atoi(argv[++i]);
        } else if (!strcmp(argv[i],"-n")) {
            if (lastarg) goto invalid;
            config.requests = atoi(argv[++i]);
        } else if (!strcmp(argv[i],"-k")) {
            if (lastarg) goto invalid;
            config.keepalive = atoi(argv[++i]);
        } else if (!strcmp(argv[i],"-h")) {
            if (lastarg) goto invalid;
            config.hostip = strdup(argv[++i]);
        } else if (!strcmp(argv[i],"-p")) {
            if (lastarg) goto invalid;
            config.hostport = atoi(argv[++i]);
        } else if (!strcmp(argv[i],"-s")) {
            if (lastarg) goto invalid;
            config.hostsocket = strdup(argv[++i]);
        } else if (!strcmp(argv[i],"-a") ) {
            if (lastarg) goto invalid;
            config.auth = strdup(argv[++i]);
        } else if (!strcmp(argv[i],"-d")) {
            if (lastarg) goto invalid;
            config.datasize = atoi(argv[++i]);
            if (config.datasize < 1) config.datasize=1;
            if (config.datasize > 1024*1024*1024) config.datasize = 1024*1024*1024;
        } else if (!strcmp(argv[i],"-P")) {
            if (lastarg) goto invalid;
            config.pipeline = atoi(argv[++i]);
            if (config.pipeline <= 0) config.pipeline=1;
        } else if (!strcmp(argv[i],"-r")) {
            if (lastarg) goto invalid;
            config.randomkeys = 1;
            config.randomkeys_keyspacelen = atoi(argv[++i]);
            if (config.randomkeys_keyspacelen < 0)
                config.randomkeys_keyspacelen = 0;
        } else if (!strcmp(argv[i],"-f")) {
            if (lastarg) goto invalid;
            config.randomfields = 1;
            config.randomfields_fieldspacelen = atoi(argv[++i]);
            if (config.randomfields_fieldspacelen < 0)
                config.randomfields_fieldspacelen = 0;
        } else if (!strcmp(argv[i],"-q")) {
            config.quiet = 1;
        } else if (!strcmp(argv[i],"--csv")) {
            config.csv = 1;
        } else if (!strcmp(argv[i],"-l")) {
            config.loop = 1;
        } else if (!strcmp(argv[i],"-I")) {
            config.idlemode = 1;
        } else if (!strcmp(argv[i],"-e")) {
            config.showerrors = 1;
        } else if (!strcmp(argv[i],"-t")) {
            if (lastarg) goto invalid;
            /* We get the list of tests to run as a string in the form
             * get,set,lrange,...,test_N. Then we add a comma before and
             * after the string in order to make sure that searching
             * for ",testname," will always get a match if the test is
             * enabled. */
            config.tests = sdsnew(",");
            config.tests = sdscat(config.tests,(char*)argv[++i]);
            config.tests = sdscat(config.tests,",");
            sdstolower(config.tests);
        } else if (!strcmp(argv[i],"-S")) {
            if (lastarg) goto invalid;
            /* We get the list of redis special type commands to run as a string in the form
             * server,list,string,hash,set,...,sortedset. Then we add a comma before and
             * after the string in order to make sure that searching
             * for ",typename," will always get a match if the type is
             * enabled. */
            config.types = sdsnew(",");
            config.types = sdscat(config.types,(char*)argv[++i]);
            config.types = sdscat(config.types,",");
            sdstolower(config.types);
        } else if (!strcmp(argv[i],"--dbnum")) {
            if (lastarg) goto invalid;
            config.dbnum = atoi(argv[++i]);
            config.dbnumstr = sdsfromlonglong(config.dbnum);
        } else if (!strcmp(argv[i],"-T")) {
            if (lastarg) goto invalid;
            config.threads_count = atoi(argv[++i]);
            /* The requests and the clients are divided by the threads count
             * when a benchmark starts, so it must be at least 1. */
            if (config.threads_count <= 0) config.threads_count=1;
        } else if (!strcmp(argv[i],"-m")) {
            config.protocol = TEST_CMD_PROTOCOL_MEMCACHE;
        } else if (!strcmp(argv[i],"--noinline")) {
            config.noinline = 1;
        } else if (!strcmp(argv[i],"--help")) {
            exit_status = 0;
            goto usage;
        } else {
            /* Assume the user meant to provide an option when the arg starts
             * with a dash. We're done otherwise and should use the remainder
             * as the command and arguments for running the benchmark. */
            if (argv[i][0] == '-') goto invalid;
            return i;
        }
    }

    return i;

invalid:
    printf("Invalid option \"%s\" or option argument missing\n\n",argv[i]);

usage:
    printf(
"Usage: vire-benchmark [-h <host>] [-p <port>] [-c <clients>] [-n <requests>] [-k <boolean>]\n\n"
" -h <hostname>      Server hostname (default 127.0.0.1)\n"
" -p <port>          Server port (default 6379)\n"
" -s <socket>        Server socket (overrides host and port)\n"
" -a <password>      Password for Redis Auth\n"
" -c <clients>       Number of parallel connections (default 100)\n"
" -n <requests>      Total number of requests (default 1000000)\n"
" -T <threads>       Threads count to run (default 2)\n"
" -d <size>          Data size of SET/GET/... value in bytes (default 16)\n"
" --dbnum <db>       SELECT the specified db number (default 0)\n"
" -k <boolean>       1=keep alive 0=reconnect (default 1)\n"
" -r <keyspacelen>   Use random keys for SET/GET/INCR/... (default 10000)\n"
"  Using this option the benchmark will expand the string __rand_key__\n"
"  inside an argument with a 12 digits number in the specified range\n"
"  from 0 to keyspacelen-1. The substitution changes every time a command\n"
"  is executed. Default tests use this to hit random keys in the\n"
"  specified range.\n"
" -f <fieldspacelen>   Use random fields for SADD/HSET/... (default 100)\n"
"  Using this option the benchmark will expand the string __rand_field__\n"
"  inside an argument with a 14 digits number in the specified range\n"
"  from 0 to fieldspacelen-1. The substitution changes every time a command\n"
"  is executed. Default tests use this to hit random fields in the\n"
"  specified range.\n"
" -P <numreq>        Pipeline <numreq> requests. Default 1 (no pipeline).\n"
" -e                 If server replies with errors, show them on stdout.\n"
"                    (no more than 1 error per second is displayed)\n"
" -q                 Quiet. Just show query/sec values\n"
" --csv              Output in CSV format\n"
" -l                 Loop. Run the tests forever\n"
" -t <tests>         Only run the comma separated list of tests. The test\n"
"                    names are the same as the ones produced as output.\n"
" -S <types>         Only run the comma separated list of the redis special types commands.\n"
"                    The type names are like 'server,string,hash,list,set,sortedset'.\n"
" -I                 Idle mode. Just open N idle connections and wait.\n"
" -m                 Use memcached protocol. This option is used for testing memcached.\n"
" --noinline         Not test redis inline commands.\n\n"
"Examples:\n\n"
" Run the benchmark with the default configuration against 127.0.0.1:6379:\n"
"   $ vire-benchmark\n\n"
" Use 20 parallel clients, for a total of 100k requests, against 192.168.1.1:\n"
"   $ vire-benchmark -h 192.168.1.1 -p 6379 -n 100000 -c 20\n\n"
" Fill 127.0.0.1:6379 with about 1 million keys only using the SET test:\n"
"   $ vire-benchmark -t set -n 1000000 -r 100000000\n\n"
" Benchmark 127.0.0.1:6379 for a few commands producing CSV output:\n"
"   $ vire-benchmark -t ping,set,get -n 100000 --csv\n\n"
" Benchmark a specific command line:\n"
"   $ vire-benchmark -r 10000 -n 10000 eval 'return redis.call(\"ping\")' 0\n\n"
" Fill a list with 10000 random elements:\n"
"   $ vire-benchmark -r 10000 -n 10000 lpush mylist __rand_field__\n\n"
" On user specified command lines __rand_key__ and __rand_field__ are replaced\n"
" with a random integer with a range of values selected by the -r and -f option.\n"
    );
    exit(exit_status);
}

/* Time event callback printing the progress of the running benchmark.
 *
 * Refreshes the global statistics and terminates the process if no client
 * is alive anymore. Nothing is printed with the csv option; in idle mode
 * the number of live clients is printed; otherwise the current requests per
 * second figure is printed. The returned value, 250, asks for the callback
 * to be fired again every 250ms. */
static int showThroughput(struct aeEventLoop *eventLoop, long long id, void *clientData) {
    float elapsed, rate;
    UNUSED(eventLoop);
    UNUSED(id);
    UNUSED(clientData);

    updateBenchmarkStats();

    if (config.liveclients == 0) {
        fprintf(stderr,"All clients disconnected... aborting.\n");
        exit(1);
    }

    if (!config.csv) {
        if (config.idlemode == 1) {
            printf("clients: %d\r", config.liveclients);
        } else {
            /* Seconds elapsed since the benchmark started. */
            elapsed = (float)(dmsec_now()-config.start)/1000.0;
            rate = (float)config.requests_finished/elapsed;
            printf("%s: %.2f\r", config.title, rate);
        }
        fflush(stdout);
    }

    return 250;
}

/* Return true if the named test was selected using the -t command line
 * switch, or if all the tests are selected (no -t passed by user).
 *
 * config.tests holds the selected names separated and surrounded by commas,
 * so the lookup searches for ",name,". A name too long to fit in the search
 * buffer is reported as not selected instead of overflowing the buffer. */
int test_is_selected(char *name) {
    char buf[256];
    int n;

    if (config.tests == NULL) return 1;

    /* snprintf() never writes past the buffer and returns the length the
     * whole string needs, which tells whether it was truncated. */
    n = snprintf(buf,sizeof(buf),",%s,",name);
    if (n < 0 || (size_t)n >= sizeof(buf)) return 0;

    return strstr(config.tests,buf) != NULL;
}

/* Return true if the named command type was selected using the -S command
 * line switch, or if all the types are selected (no -S passed by user).
 *
 * config.types holds the selected names separated and surrounded by commas,
 * so the lookup searches for ",name,". A name too long to fit in the search
 * buffer is reported as not selected instead of overflowing the buffer. */
int types_is_selected(char *name) {
    char buf[256];
    int n;

    if (config.types == NULL) return 1;

    /* snprintf() never writes past the buffer and returns the length the
     * whole string needs, which tells whether it was truncated. */
    n = snprintf(buf,sizeof(buf),",%s,",name);
    if (n < 0 || (size_t)n >= sizeof(buf)) return 0;

    return strstr(config.types,buf) != NULL;
}

/* 1 while config.requests is temporarily overridden, 0 otherwise. */
static int requests_temporarily_stats = 0;
/* Value of config.requests saved when the override was installed. */
static int requests_original = 0;

/* Replace config.requests with 'num', saving the current value. Does
 * nothing when an override is already in place. */
void set_requests_temporarily(int num) {
    if (requests_temporarily_stats == 0) {
        requests_original = config.requests;
        config.requests = num;
        requests_temporarily_stats = 1;
    }
}

/* Put back the value of config.requests saved by
 * set_requests_temporarily(). Does nothing when no override is in place. */
void retrieval_requests_to_original() {
    if (requests_temporarily_stats == 1) {
        config.requests = requests_original;
        requests_original = 0;
        requests_temporarily_stats = 0;
    }
}

/* 1 while the random keys settings are temporarily overridden, 0 otherwise. */
static int random_keys_temporarily_stats = 0;
/* Values of config.randomkeys and config.randomkeys_keyspacelen saved when
 * the override was installed. */
static int randomkeys_original = 0;
static int randomkeys_keyspacelen_original = 0;

/* Enable random keys with a key space of 'num', saving the current
 * settings. Does nothing when an override is already in place. */
void set_random_keys_temporarily(int num) {
    if (random_keys_temporarily_stats == 0) {
        randomkeys_original = config.randomkeys;
        randomkeys_keyspacelen_original = config.randomkeys_keyspacelen;

        config.randomkeys = 1;
        config.randomkeys_keyspacelen = num;

        random_keys_temporarily_stats = 1;
    }
}

/* Put back the random keys settings saved by
 * set_random_keys_temporarily(). Does nothing when no override is in
 * place. */
void retrieval_random_keys_to_original() {
    if (random_keys_temporarily_stats == 1) {
        config.randomkeys = randomkeys_original;
        config.randomkeys_keyspacelen = randomkeys_keyspacelen_original;

        randomkeys_original = 0;
        randomkeys_keyspacelen_original = 0;

        random_keys_temporarily_stats = 0;
    }
}

/* Run the benchmark using the Redis protocol.
 *
 * argc/argv are the command line arguments left over after option parsing.
 * When any are present they are sent as one custom command (repeated while
 * config.loop is set) and 0 is returned. Otherwise the default suite runs:
 * every test that passes test_is_selected() and types_is_selected() is
 * formatted, handed to benchmark() and its buffer released. The suite
 * repeats while config.loop is set.
 *
 * Returns VRT_OK after the default suite, 0 after a custom command, and
 * -1 if the payload buffer cannot be allocated. */
static int test_redis(int argc, const char **argv)
{
    int i;
    char *data, *cmd;
    int len;

    /* Run benchmark with command in the remainder of the arguments. */
    if (argc) {
        sds title = sdsnew(argv[0]);
        for (i = 1; i < argc; i++) {
            title = sdscatlen(title, " ", 1);
            title = sdscatlen(title, (char*)argv[i], strlen(argv[i]));
        }

        do {
            len = redisFormatCommandArgv(&cmd,argc,argv,NULL);
            if (len < 0) {
                /* Formatting failed, so there is no command buffer to
                 * send or to free. */
                return 0;
            }
            benchmark(title,cmd,len);
            free(cmd);
        } while(config.loop);

        return 0;
    }

    /* Run default benchmark suite. */
    data = malloc(config.datasize+1);
    if (data == NULL) {
        printf("ERROR: out of memory allocating the benchmark payload\n");
        return -1;
    }

    do {
        memset(data,'x',config.datasize);
        data[config.datasize] = '\0';

        if (!config.noinline &&
            (test_is_selected("ping_inline") ||
            test_is_selected("ping")) &&
            types_is_selected("server"))
            benchmark("PING_INLINE","PING\r\n",6);

        if ((test_is_selected("ping_mbulk") ||
            test_is_selected("ping")) &&
            types_is_selected("server")) {
            len = redisFormatCommand(&cmd,"PING");
            benchmark("PING_BULK",cmd,len);
            free(cmd);
        }

        if (test_is_selected("set") && types_is_selected("string")) {
            len = redisFormatCommand(&cmd,"SET mystring:__rand_key__ %s",data);
            benchmark("SET",cmd,len);
            free(cmd);
        }

        if (test_is_selected("get") && types_is_selected("string")) {
            len = redisFormatCommand(&cmd,"GET mystring:__rand_key__");
            benchmark("GET",cmd,len);
            free(cmd);
        }

        if (test_is_selected("incr") && types_is_selected("string")) {
            len = redisFormatCommand(&cmd,"INCR mycounter:__rand_key__");
            benchmark("INCR",cmd,len);
            free(cmd);
        }

        if (test_is_selected("mset") && types_is_selected("string")) {
            /* MSET + 10 key/value pairs = 21 arguments. */
            const char *argv[21];
            argv[0] = "MSET";
            for (i = 1; i < 21; i += 2) {
                argv[i] = "mystring:__rand_key__";
                argv[i+1] = data;
            }
            len = redisFormatCommandArgv(&cmd,21,argv,NULL);
            benchmark("MSET (10 keys)",cmd,len);
            free(cmd);
        }

        if ((test_is_selected("mget") ||
            test_is_selected("mget_10")) &&
            types_is_selected("string")) {
            const char *argv[11];
            argv[0] = "MGET";
            for (i = 1; i < 11; i ++) {
                argv[i] = "mystring:__rand_key__";
            }
            len = redisFormatCommandArgv(&cmd,11,argv,NULL);
            benchmark("MGET (10 keys)",cmd,len);
            free(cmd);
        }

        if ((test_is_selected("mget") ||
            test_is_selected("mget_100"))
            && types_is_selected("string")) {
            const char *argv[101];
            argv[0] = "MGET";
            for (i = 1; i < 101; i ++) {
                argv[i] = "mystring:__rand_key__";
            }
            len = redisFormatCommandArgv(&cmd,101,argv,NULL);
            benchmark("MGET (100 keys)",cmd,len);
            free(cmd);
        }

        if ((test_is_selected("mget") ||
            test_is_selected("mget_200")) &&
            types_is_selected("string")) {
            const char *argv[201];
            argv[0] = "MGET";
            for (i = 1; i < 201; i ++) {
                argv[i] = "mystring:__rand_key__";
            }
            len = redisFormatCommandArgv(&cmd,201,argv,NULL);
            benchmark("MGET (200 keys)",cmd,len);
            free(cmd);
        }

        if (test_is_selected("lpush") && types_is_selected("list")) {
            len = redisFormatCommand(&cmd,"LPUSH mylist:__rand_key__ %s",data);
            benchmark("LPUSH",cmd,len);
            free(cmd);
        }

        if (test_is_selected("rpush") && types_is_selected("list")) {
            len = redisFormatCommand(&cmd,"RPUSH mylist:__rand_key__ %s",data);
            benchmark("RPUSH",cmd,len);
            free(cmd);
        }

        if (test_is_selected("lpop") && types_is_selected("list")) {
            len = redisFormatCommand(&cmd,"LPOP mylist:__rand_key__");
            benchmark("LPOP",cmd,len);
            free(cmd);
        }

        if (test_is_selected("rpop") && types_is_selected("list")) {
            len = redisFormatCommand(&cmd,"RPOP mylist:__rand_key__");
            benchmark("RPOP",cmd,len);
            free(cmd);
        }

        /* Fill the lists that the LRANGE tests below read from.
         * NOTE(review): this can raise config.requests above the value
         * main() used to size config.latency; confirm benchmark() never
         * writes past that allocation. */
        if ((test_is_selected("lrange") ||
            test_is_selected("lrange_10") ||
            test_is_selected("lrange_100") ||
            test_is_selected("lrange_300") ||
            test_is_selected("lrange_450") ||
            test_is_selected("lrange_600")) &&
            types_is_selected("list"))
        {
            set_random_keys_temporarily(1000);
            if (config.requests < 1000*1000)
                set_requests_temporarily(1000*1000);
            len = redisFormatCommand(&cmd,"LPUSH mylist:__rand_key__ %s",data);
            benchmark("LPUSH (needed to benchmark LRANGE)",cmd,len);
            free(cmd);
            retrieval_requests_to_original();
            retrieval_random_keys_to_original();
        }

        /* Each LRANGE test narrows the key space to 1000 keys and caps the
         * request count for the duration of the test only. */
        if ((test_is_selected("lrange") ||
            test_is_selected("lrange_10")) &&
            types_is_selected("list")) {
            set_random_keys_temporarily(1000);
            if (config.requests > 500*1000)
                set_requests_temporarily(500*1000);
            len = redisFormatCommand(&cmd,"LRANGE mylist:__rand_key__ 0 9");
            benchmark("LRANGE_10 (first 10 elements)",cmd,len);
            free(cmd);
            retrieval_requests_to_original();
            retrieval_random_keys_to_original();
        }

        if ((test_is_selected("lrange") ||
            test_is_selected("lrange_100")) &&
            types_is_selected("list")) {
            set_random_keys_temporarily(1000);
            if (config.requests > 320000)
                set_requests_temporarily(320000);
            len = redisFormatCommand(&cmd,"LRANGE mylist:__rand_key__ 0 99");
            benchmark("LRANGE_100 (first 100 elements)",cmd,len);
            free(cmd);
            retrieval_requests_to_original();
            retrieval_random_keys_to_original();
        }

        if ((test_is_selected("lrange") ||
            test_is_selected("lrange_300")) &&
            types_is_selected("list")) {
            set_random_keys_temporarily(1000);
            if (config.requests > 160000)
                set_requests_temporarily(160000);
            len = redisFormatCommand(&cmd,"LRANGE mylist:__rand_key__ 0 299");
            benchmark("LRANGE_300 (first 300 elements)",cmd,len);
            free(cmd);
            retrieval_requests_to_original();
            retrieval_random_keys_to_original();
        }

        if ((test_is_selected("lrange") ||
            test_is_selected("lrange_450")) &&
            types_is_selected("list")) {
            set_random_keys_temporarily(1000);
            if (config.requests > 100000)
                set_requests_temporarily(100000);
            len = redisFormatCommand(&cmd,"LRANGE mylist:__rand_key__ 0 449");
            benchmark("LRANGE_450 (first 450 elements)",cmd,len);
            free(cmd);
            retrieval_requests_to_original();
            retrieval_random_keys_to_original();
        }

        if ((test_is_selected("lrange") ||
            test_is_selected("lrange_600")) &&
            types_is_selected("list")) {
            set_random_keys_temporarily(1000);
            if (config.requests > 100000)
                set_requests_temporarily(100000);
            len = redisFormatCommand(&cmd,"LRANGE mylist:__rand_key__ 0 599");
            benchmark("LRANGE_600 (first 600 elements)",cmd,len);
            free(cmd);
            retrieval_requests_to_original();
            retrieval_random_keys_to_original();
        }

        if (test_is_selected("sadd") && types_is_selected("set")) {
            len = redisFormatCommand(&cmd,
                "SADD myset:__rand_key__ %s:__rand_field__", data);
            benchmark("SADD",cmd,len);
            free(cmd);
        }

        if (test_is_selected("spop") && types_is_selected("set")) {
            len = redisFormatCommand(&cmd,"SPOP myset:__rand_key__");
            benchmark("SPOP",cmd,len);
            free(cmd);
        }

        if (test_is_selected("hset") && types_is_selected("hash")) {
            len = redisFormatCommand(&cmd,"HSET myhash:__rand_key__ field:__rand_field__ %s", data);
            benchmark("HSET",cmd,len);
            free(cmd);
        }

        if (test_is_selected("hincrby") && types_is_selected("hash")) {
            len = redisFormatCommand(&cmd,"HINCRBY myhashcounter:__rand_key__ field:__rand_field__ 19");
            benchmark("HINCRBY",cmd,len);
            free(cmd);
        }

        if (test_is_selected("hincrbyfloat") && types_is_selected("hash")) {
            len = redisFormatCommand(&cmd,"HINCRBYFLOAT myhashcounterf:__rand_key__ field:__rand_field__ 19.963");
            benchmark("HINCRBYFLOAT",cmd,len);
            free(cmd);
        }

        if (test_is_selected("hget") && types_is_selected("hash")) {
            len = redisFormatCommand(&cmd,"HGET myhash:__rand_key__ field:__rand_field__");
            benchmark("HGET",cmd,len);
            free(cmd);
        }

        if (test_is_selected("hmset") && types_is_selected("hash")) {
            /* HMSET + key + 10 field/value pairs = 22 arguments, so the
             * array must hold 22 entries (indexes 0..21). */
            const char *argv[22];
            argv[0] = "HMSET";
            argv[1] = "myhashm:__rand_key__";
            for (i = 2; i < 22; i += 2) {
                argv[i] = "field:__rand_field__";
                argv[i+1] = data;
            }
            len = redisFormatCommandArgv(&cmd,22,argv,NULL);
            benchmark("HMSET (10 fields)",cmd,len);
            free(cmd);
        }

        if (test_is_selected("hmget") && types_is_selected("hash")) {
            /* HMGET + key + 10 fields = 12 arguments. */
            const char *argv[12];
            argv[0] = "HMGET";
            argv[1] = "myhashm:__rand_key__";
            for (i = 2; i < 12; i ++) {
                argv[i] = "field:__rand_field__";
            }
            len = redisFormatCommandArgv(&cmd,12,argv,NULL);
            benchmark("HMGET (10 fields)",cmd,len);
            free(cmd);
        }

        if (test_is_selected("hgetall") && types_is_selected("hash")) {
            len = redisFormatCommand(&cmd,"HGETALL myhash:__rand_key__");
            benchmark("HGETALL",cmd,len);
            free(cmd);
        }

        if (test_is_selected("zadd") && types_is_selected("sortedset")) {
            len = redisFormatCommand(&cmd,"ZADD mysortedset:__rand_key__ __rand_field__ %s:__rand_field__", data);
            benchmark("ZADD",cmd,len);
            free(cmd);
        }

        if (test_is_selected("zrem") && types_is_selected("sortedset")) {
            len = redisFormatCommand(&cmd,"ZREM mysortedset:__rand_key__ %s:__rand_field__", data);
            benchmark("ZREM",cmd,len);
            free(cmd);
        }

        if (test_is_selected("pfadd") && types_is_selected("hyperloglog")) {
            len = redisFormatCommand(&cmd,"PFADD myhll:__rand_key__ %s:__rand_field__", data);
            benchmark("PFADD",cmd,len);
            free(cmd);
        }

        if (test_is_selected("pfcount") && types_is_selected("hyperloglog")) {
            len = redisFormatCommand(&cmd,"PFCOUNT myhll:__rand_key__");
            benchmark("PFCOUNT",cmd,len);
            free(cmd);
        }

        if (test_is_selected("pfmerge") && types_is_selected("hyperloglog")) {
            len = redisFormatCommand(&cmd,"PFADD myhll:__rand_key__ %s:__rand_field__", data);
            benchmark("PFADD (needed to benchmark PFMERGE)",cmd,len);
            free(cmd);

            len = redisFormatCommand(&cmd,"PFMERGE myhllm:__rand_key__ myhll:__rand_key__ myhll:__rand_key__");
            benchmark("PFMERGE",cmd,len);
            free(cmd);
        }

        if (!config.csv) printf("\n");
    } while(config.loop);

    /* Every command buffer built from data has already been sent and
     * freed above, so the payload is no longer referenced. */
    free(data);

    return VRT_OK;
}

/* Run the benchmark using the memcached protocol.
 *
 * argc/argv are the command line arguments left over after option parsing.
 * When any are present they are sent as one custom command (repeated while
 * config.loop is set) and 0 is returned. Otherwise the default suite (SET
 * and GET, each subject to test_is_selected()) runs, repeating while
 * config.loop is set.
 *
 * Returns VRT_OK after the default suite, 0 after a custom command, and
 * -1 if the payload buffer cannot be allocated. */
static int test_memcached(int argc, const char **argv)
{
    int i;
    char *data, *cmd;
    int len;

    /* Run benchmark with command in the remainder of the arguments. */
    if (argc) {
        sds title = sdsnew(argv[0]);
        for (i = 1; i < argc; i++) {
            title = sdscatlen(title, " ", 1);
            title = sdscatlen(title, (char*)argv[i], strlen(argv[i]));
        }

        do {
            len = memcachedFormatCommandArgv(&cmd,argc,argv,NULL);
            if (len < 0) {
                return 0;
            }

            benchmark(title,cmd,len);
            free(cmd);
        } while(config.loop);

        return 0;
    }

    /* Run default benchmark suite. */
    data = malloc(config.datasize+1);
    if (data == NULL) {
        printf("ERROR: out of memory allocating the benchmark payload\n");
        return -1;
    }

    do {
        memset(data,'x',config.datasize);
        data[config.datasize] = '\0';

        if (test_is_selected("set")) {
            len = memcachedFormatCommand(&cmd,"set key:__rand_key__ 0 0 %d %s", config.datasize, data);
            /* Same failure convention as the custom-command path above:
             * a negative length means there is no buffer to send or free. */
            if (len < 0) {
                printf("ERROR: failed to format the SET command\n");
            } else {
                benchmark("SET",cmd,len);
                free(cmd);
            }
        }

        if (test_is_selected("get")) {
            len = memcachedFormatCommand(&cmd,"get key:__rand_key__");
            if (len < 0) {
                printf("ERROR: failed to format the GET command\n");
            } else {
                benchmark("GET",cmd,len);
                free(cmd);
            }
        }

        if (!config.csv) printf("\n");
    } while(config.loop);

    /* Every command buffer built from data has already been sent and
     * freed above, so the payload is no longer referenced. */
    free(data);

    return VRT_OK;
}

/* Benchmark entry point.
 *
 * Fills config with defaults, applies the command line options, validates
 * and clamps the thread/client/request counts, allocates the latency
 * buffer and runs the suite for the configured protocol.
 *
 * Returns 0 on completion and -1 when a count is not positive or the
 * latency buffer cannot be allocated. */
int main(int argc, const char **argv) {
    int i;

    srandom(time(NULL));
    signal(SIGHUP, SIG_IGN);
    signal(SIGPIPE, SIG_IGN);

    config.numclients = 100;
    config.requests = 1000000;
    config.liveclients = 0;
    config.keepalive = 1;
    config.datasize = 16;
    config.pipeline = 1;
    config.showerrors = 0;
    config.randomkeys = 1;
    config.randomkeys_keyspacelen = 10000;
    config.randomfields = 1;
    config.randomfields_fieldspacelen = 100;
    config.quiet = 0;
    config.csv = 0;
    config.loop = 0;
    config.idlemode = 0;
    config.latency = NULL;
    config.hostip = "127.0.0.1";
    config.hostport = 6379;
    config.hostsocket = NULL;
    config.tests = NULL;
    config.types = NULL;
    config.dbnum = 0;
    config.auth = NULL;
    config.threads_count = 2;
    config.protocol = TEST_CMD_PROTOCOL_REDIS;
    config.noinline = 0;

    /* parseOptions() returns how many leading arguments it consumed; what
     * remains is treated as a custom command by the test functions. */
    i = parseOptions(argc,argv);
    argc -= i;
    argv += i;

    /* Init the benchmark threads */
    if (config.threads_count <= 0) {
        printf("ERROR: threads count need bigger than zero\n");
        return -1;
    }
    if (config.requests <= 0) {
        printf("ERROR: requests count need bigger than zero\n");
        return -1;
    }
    if (config.numclients <= 0) {
        printf("ERROR: clients count need bigger than zero\n");
        return -1;
    }
    /* Never use more clients than requests, nor more threads than
     * requests or clients. */
    if (config.requests < config.numclients) config.numclients = config.requests;
    if (config.requests < config.threads_count) config.threads_count = config.requests;
    if (config.numclients < config.threads_count) config.threads_count = config.numclients;

    config.latency = malloc(sizeof(long long)*config.requests);
    if (config.latency == NULL) {
        printf("ERROR: out of memory allocating the latency buffer\n");
        return -1;
    }

    if (config.keepalive == 0) {
        printf("WARNING: keepalive disabled, you probably need 'echo 1 > /proc/sys/net/ipv4/tcp_tw_reuse' for Linux and 'sudo sysctl -w net.inet.tcp.msl=1000' for Mac OS X in order to use a lot of clients/requests\n");
    }

    /* Idle mode is currently disabled. Re-enabling the code below also
     * needs a local "benchmark_client c;" declaration. */
    //if (config.idlemode) {
    //    printf("Creating %d idle connections and waiting forever (Ctrl+C when done)\n", config.numclients);
    //    c = createClient("",0,NULL); /* will never receive a reply */
    //    createMissingClients(c);
    //    aeMain(config.el);
        /* and will wait for every */
    //}

    if (config.protocol == TEST_CMD_PROTOCOL_REDIS) {
        test_redis(argc, argv);
    } else if (config.protocol == TEST_CMD_PROTOCOL_MEMCACHE) {
        test_memcached(argc, argv);
    } else {
        NOT_REACHED();
    }

    return 0;
}


================================================
FILE: tests/vrt_check_data.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <getopt.h>
#include <fcntl.h>
#include <errno.h>
#include <signal.h>
#include <pthread.h>
#include <sys/stat.h>
#include <sys/utsname.h>

#include <hiredis.h>
#include <async.h>
#include <adapters/ae.h>

#include <dhashkit.h>
#include <dlist.h>
#include <dmtqueue.h>
#include <dlog.h>

#include <vrt_util.h>
#include <vrt_public.h>
#include <vrabtest.h>
#include <vrt_produce_data.h>
#include <vrt_dispatch_data.h>
#include <vrt_backend.h>
#include <vrt_check_data.h>

/* Role flags.
 * NOTE(review): presumably stored in data_checker.flags - confirm against
 * the code that sets them. */
#define CHECK_DATA_FLAG_NONE        (1<<0)
#define CHECK_DATA_FLAG_MASTER      (1<<1)
#define CHECK_DATA_FLAG_SLAVE       (1<<2)

/* Values of check_unit.state. They name the reply that
 * check_data_callback() is waiting for: a new unit starts at NULL, then
 * moves through GET_EXPIRE ("ttl"), GET_TYPE ("type") and GET_VALUE (the
 * type-specific read command). */
#define CHECK_UNIT_STATE_NULL           0
#define CHECK_UNIT_STATE_GET_EXPIRE     1
#define CHECK_UNIT_STATE_GET_TYPE       2
#define CHECK_UNIT_STATE_GET_VALUE      3

/* State owned by one data-check thread: its event loop, the groups being
 * compared, the progress of the key scan and the checks in flight. */
typedef struct check_data_thread {
    int id;
    pthread_t thread_id;
    
    aeEventLoop *el;
    int hz;
    int cronloops;  /* Number of times the cron function run */

    darray *abgs;   /* Type is abtest_group */
    int scan_group_idx; /* The group idx to scan keys */
    darray *scan_servers;   /* The servers in the scan group, type is abtest_server */
    int scan_finished_count;
    long long cursor;   /* scan cursor, updated from each scan reply */
    dlist *check_units; /* check_unit objects in flight: start_check_data()
                         * appends, check_unit_destroy() removes */

    long long check_begin_time; /* Unit is second */
    long long scan_keys_count;  /* Grows by the number of keys in each scan reply */
} check_data_thread;

/* One in-flight consistency check of a single key. The same command is
 * sent to one server per group and the replies are collected here until
 * they can be compared (see check_data_callback()). */
typedef struct check_unit {
    check_data_thread *cdt; /* Owning thread */

    dlistNode *lnode;       /* This unit's node in cdt->check_units */
    
    sds key;                /* Private copy of the key being checked */

    int key_persist;        /* Set to 1 when the ttl replies are -1 */
    long long min_ttl, max_ttl_gap; /* Smallest ttl seen and max-min spread */
    
    int key_type;           /* REDIS_STRING, REDIS_LIST, ...; -1 until known */
    int state;              /* One of CHECK_UNIT_STATE_* */

    darray servers; /* Servers used to send the check messages, type is pointer of abtest_server */
    darray replys;  /* Used to cache the replys from the servers, type is pointer of redisReply */

    unsigned int servers_count;     /* Number of servers queried */
    unsigned int replys_count;      /* Replies cached for the current step */
    unsigned int not_exist_count;   /* Servers reporting the key as missing in the current step */
} check_unit;

/* State of the data checker as a whole (a single file-scope instance, dc,
 * is defined below this struct).
 * NOTE(review): the code using most of these fields is outside this part
 * of the file; field notes beyond the original ones are deliberately
 * omitted. */
typedef struct data_checker {
    pthread_t thread_id;
    
    aeEventLoop *el;
    int hz;
    int cronloops;          /* Number of times the cron function run */

    sds test_target_groups;

    int flags;              /* presumably CHECK_DATA_FLAG_* bits - TODO confirm */
    sds checker;
    conn_context *master;   /* If this is a slave */

    long long check_begin_time; /* Unit is second */
} data_checker;

/* The file-scope data_checker instance. */
static data_checker dc;

/* Last begin time to check the data.
 * Unit is second */
static long long last_check_begin_time;

/* NOTE(review): presumably the array of check_data_thread workers -
 * confirm against the code that allocates it. */
static darray *cdts = NULL;

/* Allocate a check_unit in its initial state: no owner, no list node, no
 * key, unknown key type (-1), state CHECK_UNIT_STATE_NULL, all counters
 * zero, and both darrays initialised for two pointer-sized elements.
 * Returns NULL when the allocation fails. */
static check_unit *check_unit_create(void)
{
    check_unit *unit = malloc(sizeof(*unit));

    if (unit == NULL) return NULL;

    /* Not attached to any thread or list yet. */
    unit->cdt = NULL;
    unit->lnode = NULL;

    /* Nothing is known about the key yet. */
    unit->key = NULL;
    unit->key_type = -1;
    unit->key_persist = 0;
    unit->min_ttl = 0;
    unit->max_ttl_gap = 0;
    unit->state = CHECK_UNIT_STATE_NULL;

    unit->servers_count = 0;
    unit->replys_count = 0;
    unit->not_exist_count = 0;

    darray_init(&unit->servers, 2, sizeof(abtest_server*));
    darray_init(&unit->replys, 2, sizeof(redisReply*));

    return unit;
}

/* Release a check_unit: unlink it from its owner's check_units list (when
 * it has both an owner and a node), free the key, empty both darrays
 * (freeing every cached reply) and finally free the unit itself. */
static void check_unit_destroy(check_unit *cunit)
{
    redisReply **cached;

    if (cunit->cdt != NULL && cunit->lnode != NULL) {
        dlistDelNode(cunit->cdt->check_units,cunit->lnode);
        cunit->lnode = NULL;
    }

    if (cunit->key != NULL) {
        sdsfree(cunit->key);
        cunit->key = NULL;
    }

    /* The server entries are popped without being freed here. */
    for (; darray_n(&cunit->servers) > 0; ) {
        darray_pop(&cunit->servers);
    }
    darray_deinit(&cunit->servers);

    /* The cached replies are freed as they are popped. */
    for (; darray_n(&cunit->replys) > 0; ) {
        cached = darray_pop(&cunit->replys);
        freeReplyObject(*cached);
    }
    darray_deinit(&cunit->replys);

    free(cunit);
}

/* Open an asynchronous hiredis connection to host:port and store it in
 * cc->actx; cc->ctx is left NULL.
 *
 * hiredis can hand back a non-NULL async context whose err field is
 * already set, so that case is treated as a failure too: the context is
 * freed and cc->actx is reset to NULL.
 *
 * Returns VRT_OK on success, VRT_ERROR otherwise. */
static int check_conn_context_init(conn_context *cc, char *host, int port)
{
    cc->ctx = NULL;
    cc->actx = NULL;

    cc->actx = redisAsyncConnect(host, port);
    if (cc->actx == NULL) {
        return VRT_ERROR;
    }

    if (cc->actx->err) {
        redisAsyncFree(cc->actx);
        cc->actx = NULL;
        return VRT_ERROR;
    }

    return VRT_OK;
}

/* Free whichever hiredis contexts cc holds and reset the pointers to NULL
 * so that a second call, or a later check of cc, never sees a freed
 * context. */
static void check_conn_context_deinit(conn_context *cc)
{
    if (cc->ctx) {
        redisFree(cc->ctx);
        cc->ctx = NULL;
    }

    if (cc->actx) {
        /* Clear the event adapter's cleanup hook before freeing.
         * NOTE(review): presumably because the event loop may already be
         * gone at this point - confirm. */
        cc->actx->ev.cleanup = NULL;
        redisAsyncFree(cc->actx);
        cc->actx = NULL;
    }
}

/* hiredis connect callback: logs the context's error string when the
 * connection attempt did not succeed; a successful connect is silent. */
static void connect_callback(const redisAsyncContext *c, int status) {
    if (status == REDIS_OK) {
        /* Connected; nothing to report. */
        return;
    }

    test_log_out("Error: %s\n", c->errstr);
}

/* hiredis disconnect callback: logs the context's error string when the
 * disconnect was caused by an error; a clean disconnect is silent. */
static void disconnect_callback(const redisAsyncContext *c, int status) {
    if (status == REDIS_OK) {
        /* Clean disconnect; nothing to report. */
        return;
    }

    test_log_out("Error: %s\n", c->errstr);
}

/* Sort the elements of every cached array reply for the key types handled
 * here: sets are sorted with a step of 1 and hashes with a step of 2,
 * comparing on index 0 of each step. Other key types and non-array
 * replies are left untouched. Always returns VRT_OK. */
static int sort_replys_if_needed(check_unit *cunit)
{
    int stride;
    int cmp_idx = 0;
    int n;
    redisReply **slot;

    if (cunit->key_type == REDIS_SET) {
        stride = 1;
    } else if (cunit->key_type == REDIS_HASH) {
        stride = 2;
    } else {
        /* Nothing to sort for this key type. */
        return VRT_OK;
    }

    for (n = 0; n < darray_n(&cunit->replys); n ++) {
        slot = darray_get(&cunit->replys, n);
        if ((*slot)->type == REDIS_REPLY_ARRAY) {
            sort_array_by_step((*slot)->element, (*slot)->elements,
                stride, cmp_idx, reply_string_binary_compare);
        }
    }

    return VRT_OK;
}

/* Compare every cached reply against the first one, after sorting them
 * where the key type requires it.
 *
 * Returns 1 when all replies are the same, 0 when they differ.
 * NOTE(review): this relies on check_two_replys_if_same() returning
 * non-zero for a mismatch - confirm against its definition. */
static int check_replys_if_same(check_unit *cunit)
{
    redisReply **first, **other;
    unsigned int idx = 1;

    sort_replys_if_needed(cunit);

    first = darray_get(&cunit->replys,0);

    while (idx < cunit->replys_count) {
        other = darray_get(&cunit->replys,idx);
        if (check_two_replys_if_same(*first, *other) != 0) {
            return 0;
        }
        idx ++;
    }

    return 1;
}

/* Largest difference between the ttl values reported by the servers that
 * is still accepted as "the same" expire time. */
#define TTL_MISTAKE_CAN_BE_ACCEPT   3

/* hiredis reply callback driving the three-step check of one key.
 *
 * privdata is the check_unit. Each step sends one command to every server
 * in cunit->servers and waits until all of them have answered:
 *   1. CHECK_UNIT_STATE_GET_EXPIRE: "ttl"  - persistence and ttl spread
 *   2. CHECK_UNIT_STATE_GET_TYPE:   "type" - the key type must agree
 *   3. CHECK_UNIT_STATE_GET_VALUE:  the type-specific read command - the
 *      values must agree
 * Replies are cached in cunit->replys. When a step completes the function
 * moves on (next_step), finishes and frees the unit (done), or logs the
 * key with a reason and frees the unit (error). A NULL reply is ignored. */
static void check_data_callback(redisAsyncContext *c, void *r, void *privdata) {
    redisReply *reply = r, *reply_elem;
    redisReply *reply_clone, **elem;
    check_unit *cunit = privdata;
    check_data_thread *cdt = cunit->cdt;
    char *errmsg = "unknown error";
    int j;

    if (reply == NULL) return;

    if (cunit->state == CHECK_UNIT_STATE_GET_EXPIRE) {
        if (reply->type != REDIS_REPLY_INTEGER) {
            errmsg = "ttl command reply type is not integer";
            goto error;
        }

        reply_clone = steal_hiredis_redisreply(reply);
        elem = darray_push(&cunit->replys);
        *elem = reply_clone;
        cunit->replys_count ++;

        if (cunit->replys_count >= cunit->servers_count) {
            char *argv[2];
            size_t argvlen[2];
            /* Initialised because only some branches below assign them,
             * while the loop and the code after it read them. */
            long long min = 0, max = 0;
            int persist = 0;

            /* ttl replies: -1 = no expire, -2 = key missing, >= 0 = ttl. */
            elem = darray_get(&cunit->replys, 0);
            reply_elem = *elem;
            if (reply_elem->integer == -1) {
                persist = 1;
            } else if (reply_elem->integer == -2) {
                cunit->not_exist_count ++;
                min = max = 0;
            } else if (reply_elem->integer < -2) {
                errmsg = "ttl command reply integer is less than -2";
                goto error;
            } else {
                min = max =  reply_elem->integer;
            }

            for (j = 1; j < darray_n(&cunit->replys); j ++) {
                elem = darray_get(&cunit->replys, j);
                reply_elem = *elem;
                if (persist && reply_elem->integer != -1) {
                    errmsg = "key in some server is persist, but others are not";
                    goto error;
                }

                if (reply_elem->integer == -1) {
                    if (persist != 1) {
                        errmsg = "key in some server is persist, but others are not";
                        goto error;
                    }
                } else if (reply_elem->integer == -2) {
                    cunit->not_exist_count ++;
                    if (min > 0) min = 0;
                } else if (reply_elem->integer < -2) {
                    errmsg = "ttl command reply integer is less than -2";
                    goto error;
                } else {
                    if (reply_elem->integer < min) min = reply_elem->integer;
                    if (reply_elem->integer > max) max = reply_elem->integer;
                }
            }

            if (cunit->not_exist_count >= cunit->servers_count) {
                /* The key in all the target group is expired */
                goto done;
            }

            if (persist) {
                cunit->key_persist = 1;
            } else {
                cunit->min_ttl = min;
                cunit->max_ttl_gap = max-min;
                if (cunit->max_ttl_gap > TTL_MISTAKE_CAN_BE_ACCEPT) {
                    errmsg = "ttl mistake is too big between groups";
                    goto error;
                }
            }

            /* Check step 2: get the key type */
            argv[0] = "type";
            argvlen[0] = 4;
            argv[1] = cunit->key;
            argvlen[1] = sdslen(cunit->key);
            for (j = 0; j < darray_n(&cunit->servers); j ++) {
                abtest_server **abs = darray_get(&cunit->servers,j);
                conn_context *cc = darray_get((*abs)->conn_contexts, 0);

                redisAsyncCommandArgv(cc->actx, check_data_callback,
                    cunit, 2, argv, argvlen);
            }

            cunit->state = CHECK_UNIT_STATE_GET_TYPE;
            goto next_step;
        }

        return;
    }

    if (cunit->state == CHECK_UNIT_STATE_GET_TYPE) {
        if (reply->type != REDIS_REPLY_STATUS) {
            errmsg = "type command reply type is not status";
            goto error;
        }

        if (!strcmp(reply->str, "none")) {
            /* This key doesn't exist, may be expired or evicted */
            cunit->not_exist_count ++;
        } else {
            reply_clone = steal_hiredis_redisreply(reply);
            elem = darray_push(&cunit->replys);
            *elem = reply_clone;
            cunit->replys_count ++;
        }

        if (cunit->not_exist_count >= cunit->servers_count) {
            /* The key in all the target group is expired */
            goto done;
        } else if (cunit->replys_count >= (cunit->servers_count-cunit->not_exist_count)) {
            /* The longest command built below has four arguments. The
             * arrays are only read while redisAsyncCommandArgv() runs, so
             * automatic storage is enough. */
            int argc;
            char *argv[4];
            size_t argvlen[4];

            if (cunit->not_exist_count > 0 && cunit->key_persist) {
                errmsg = "key is persist, but not exist in some servers";
                goto error;
            }

            if (check_replys_if_same(cunit) != 1) {
                errmsg = "type command replys are not same";
                goto error;
            }

            elem = darray_get(&cunit->replys,0);
            if (!strcmp((*elem)->str,"string")) {
                cunit->key_type = REDIS_STRING;

                argc = 2;
                argv[0] = "get";
                argvlen[0] = 3;
                argv[1] = cunit->key;
                argvlen[1] = sdslen(cunit->key);
            } else if (!strcmp((*elem)->str,"list")) {
                cunit->key_type = REDIS_LIST;

                argc = 4;
                argv[0] = "lrange";
                argvlen[0] = 6;
                argv[1] = cunit->key;
                argvlen[1] = sdslen(cunit->key);
                argv[2] = "0";
                argvlen[2] = 1;
                argv[3] = "-1";
                argvlen[3] = 2;
            } else if (!strcmp((*elem)->str,"set")) {
                cunit->key_type = REDIS_SET;

                argc = 2;
                argv[0] = "smembers";
                argvlen[0] = 8;
                argv[1] = cunit->key;
                argvlen[1] = sdslen(cunit->key);
            } else if (!strcmp((*elem)->str,"zset")) {
                cunit->key_type = REDIS_ZSET;

                argc = 4;
                argv[0] = "zrange";
                argvlen[0] = 6;
                argv[1] = cunit->key;
                argvlen[1] = sdslen(cunit->key);
                argv[2] = "0";
                argvlen[2] = 1;
                argv[3] = "-1";
                argvlen[3] = 2;
            } else if (!strcmp((*elem)->str,"hash")) {
                cunit->key_type = REDIS_HASH;

                argc = 2;
                argv[0] = "hgetall";
                argvlen[0] = 7;
                argv[1] = cunit->key;
                argvlen[1] = sdslen(cunit->key);
            } else {
                errmsg = "not supported key type";
                goto error;
            }

            /* Check step 3: get the value */
            for (j = 0; j < darray_n(&cunit->servers); j ++) {
                abtest_server **abs = darray_get(&cunit->servers,j);
                conn_context *cc = darray_get((*abs)->conn_contexts, 0);

                redisAsyncCommandArgv(cc->actx, check_data_callback,
                    cunit, argc, argv, argvlen);
            }

            cunit->state = CHECK_UNIT_STATE_GET_VALUE;
            goto next_step;
        }

        return;
    }

    if (cunit->state == CHECK_UNIT_STATE_GET_VALUE) {
        /* A nil string or an empty array counts as "key missing". */
        int not_exist = 0;
        if (cunit->key_type == REDIS_STRING) {
            if (reply->type == REDIS_REPLY_NIL) {
                not_exist = 1;
            } else if (reply->type != REDIS_REPLY_STRING) {
                errmsg = "get command reply type is not string";
                goto error;
            }
        } else if (cunit->key_type == REDIS_LIST) {
            if (reply->type != REDIS_REPLY_ARRAY) {
                errmsg = "lrange command reply type is not array";
                goto error;
            }
            if (reply->elements == 0) {
                not_exist = 1;
            }
        } else if (cunit->key_type == REDIS_SET) {
            if (reply->type != REDIS_REPLY_ARRAY) {
                errmsg = "smembers command reply type is not array";
                goto error;
            }
            if (reply->elements == 0) {
                not_exist = 1;
            }
        } else if (cunit->key_type == REDIS_ZSET) {
            if (reply->type != REDIS_REPLY_ARRAY) {
                errmsg = "zrange command reply type is not array";
                goto error;
            }
            if (reply->elements == 0) {
                not_exist = 1;
            }
        } else if (cunit->key_type == REDIS_HASH) {
            if (reply->type != REDIS_REPLY_ARRAY) {
                errmsg = "hgetall command reply type is not array";
                goto error;
            }
            if (reply->elements == 0) {
                not_exist = 1;
            }
        } else {
            errmsg = "not supported key type";
            goto error;
        }

        if (not_exist) {
            cunit->not_exist_count ++;
        } else {
            reply_clone = steal_hiredis_redisreply(reply);
            elem = darray_push(&cunit->replys);
            *elem = reply_clone;
            cunit->replys_count ++;
        }

        if (cunit->not_exist_count >= cunit->servers_count) {
            /* The key in all the target group is expired */
            goto done;
        } else if (cunit->replys_count >= (cunit->servers_count-cunit->not_exist_count)) {
            if (cunit->not_exist_count > 0 && cunit->key_persist) {
                errmsg = "key is persist, but not exist in some servers";
                goto error;
            }

            if (check_replys_if_same(cunit) != 1) {
                errmsg = "values for reply are not same";
                goto error;
            }

            goto done;
        }

        return;
    }

done:

    check_unit_destroy(cunit);

    return;

next_step:

    /* Start the next step with empty counters and an empty reply cache. */
    cunit->replys_count = 0;
    cunit->not_exist_count = 0;
    while (darray_n(&cunit->replys) > 0) {
        elem = darray_pop(&cunit->replys);
        freeReplyObject(*elem);
    }

    return;

error:

    /* NOTE(review): an error can be raised before every server has
     * answered the current step; the outstanding replies still carry this
     * cunit as privdata. Confirm they cannot reach this callback after
     * the unit has been freed. */
    log_hexdump(LOG_ERR,cunit->key,sdslen(cunit->key),
        "%s, scan group id: %d, key(len:%zu, type: %s): ",
        errmsg,
        cdt->scan_group_idx,
        sdslen(cunit->key),get_key_type_string(cunit->key_type));

    check_unit_destroy(cunit);
}

/* Begin the verification of one key.
 *
 * A check unit is created for the key and appended to the thread's list of
 * pending units. For every abtest group the backend server selected by the
 * group's get_backend_server() hook is recorded in the unit and asked for
 * the key's TTL (check step 1); replies are delivered to
 * check_data_callback() with the unit as private data.
 *
 * Always returns VRT_OK. */
static int start_check_data(char *key, size_t keylen, check_data_thread *cdt)
{
    check_unit *unit = check_unit_create();
    int group_idx;

    unit->cdt = cdt;
    unit->key = sdsnewlen(key,keylen);
    dlistPush(cdt->check_units,unit);
    /* Remember the list node that was just pushed for this unit. */
    unit->lnode = dlistLast(cdt->check_units);

    for (group_idx = 0; group_idx < darray_n(cdt->abgs); group_idx ++) {
        char *argv[2];
        size_t argvlen[2];
        abtest_group *group = darray_get(cdt->abgs, group_idx);
        abtest_server *server = group->get_backend_server(group,key,keylen);
        abtest_server **slot = darray_push(&unit->servers);
        conn_context *conn = darray_get(server->conn_contexts, 0);

        *slot = server;
        unit->servers_count ++;

        /* Check step 1: get the expire */
        argv[0] = "ttl";
        argvlen[0] = 3;
        argv[1] = key;
        argvlen[1] = keylen;
        redisAsyncCommandArgv(conn->actx, check_data_callback,
            unit, 2, argv, argvlen);
    }

    unit->state = CHECK_UNIT_STATE_GET_EXPIRE;

    return VRT_OK;
}

/* Reply handler for the "scan" command issued by check_data_thread_cron().
 *
 * privdata is the abtest_server that was scanned; its data field points to
 * the owning check thread. A usable reply is a two element array: the next
 * cursor (a string holding an integer) and an array of key names. Anything
 * else is silently ignored.
 *
 * The thread's cursor is updated, a check is started for every returned key,
 * and when the cursor comes back as 0 the current server is counted as
 * completely scanned. */
static void scan_for_check_callback(redisAsyncContext *c, void *r, void *privdata) {
    redisReply *scan_reply = r;
    redisReply *cursor_reply, *keys_reply;
    abtest_server *server = privdata;
    check_data_thread *cdt = server->data;
    long long next_cursor;
    size_t i;

    if (scan_reply == NULL ||
        scan_reply->type != REDIS_REPLY_ARRAY ||
        scan_reply->elements != 2) {
        return;
    }

    cursor_reply = scan_reply->element[0];
    if (cursor_reply->type != REDIS_REPLY_STRING) {
        return;
    }
    if (string2ll(cursor_reply->str,cursor_reply->len,&next_cursor) != 1) {
        return;
    }

    cdt->cursor = next_cursor;

    keys_reply = scan_reply->element[1];
    if (keys_reply->type != REDIS_REPLY_ARRAY) {
        return;
    }

    for (i = 0; i < keys_reply->elements; i ++) {
        redisReply *key_reply = keys_reply->element[i];

        /* A non-string key aborts the whole batch; the counters below are
         * then left untouched. */
        if (key_reply->type != REDIS_REPLY_STRING) {
            return;
        }

        start_check_data(key_reply->str,key_reply->len,cdt);
    }

    cdt->scan_keys_count += keys_reply->elements;

    if (cdt->cursor == 0) {
        cdt->scan_finished_count ++;
    }
}

/* Number of check threads that have reported completion in the current
 * check round; reset to 0 by end_check_data(). */
static int check_data_threads_finished_count = 0;

/* Record that one more check thread has finished its work. */
static void one_check_data_thread_finished(void)
{
    update_state_add(check_data_threads_finished_count,1);
}

/* Return 1 when at least as many check threads have reported completion as
 * there are entries in cdts, 0 otherwise. */
static int all_check_data_threads_finished(void)
{
    int done;

    update_state_get(check_data_threads_finished_count,&done);

    return (done >= darray_n(cdts)) ? 1 : 0;
}

/* Timer callback of a check thread.
 *
 * - Once every scan server of this thread has been scanned completely and no
 *   check unit is pending, the event loop is stopped and the thread is
 *   reported as finished.
 * - Otherwise, while fewer than 3000 check units are pending, another SCAN
 *   is sent to the server currently being scanned, using the cursor stored
 *   by scan_for_check_callback().
 *
 * The return value is handed back to the ae timer machinery; presumably it
 * is the delay in milliseconds until the next invocation.
 *
 * NOTE(review): nothing in this function tracks whether the previous SCAN
 * has been answered, so several SCANs carrying the same cursor may be in
 * flight at once — confirm that this is intended. */
static int check_data_thread_cron(aeEventLoop *eventLoop, long long id, void *clientData)
{
    check_data_thread *cdt = clientData;

    ASSERT(eventLoop == cdt->el);

    if (cdt->scan_finished_count >= darray_n(cdt->scan_servers)) {
        if (dlistLength(cdt->check_units) == 0) {
            aeStop(cdt->el);
            one_check_data_thread_finished();
            log_debug(LOG_NOTICE, "One check thread finished,scaned %lld keys",
                cdt->scan_keys_count);
            return 1;
        }
    } else if (dlistLength(cdt->check_units) < 3000) {
        /* scan_finished_count doubles as the index of the server that is
         * currently being scanned. */
        abtest_server **server = darray_get(cdt->scan_servers, cdt->scan_finished_count);
        conn_context *cc = darray_get((*server)->conn_contexts, 0);

        redisAsyncCommand(cc->actx, scan_for_check_callback,
            *server, "scan %lld count 1000", cdt->cursor);
    }

    cdt->cronloops ++;
    return 1000/cdt->hz;
}

/* Prepare one check thread.
 *
 * All fields are reset, then the event loop, the scan server array, the
 * private copy of the abtest groups (parsed from test_target_groups), one
 * async connection per server attached to the thread's event loop, the cron
 * timer and finally the list of pending check units are created.
 *
 * Returns VRT_OK on success and VRT_ERROR as soon as one step fails; what
 * was created so far is left in place. */
static int check_data_thread_init(check_data_thread *cdt, char *test_target_groups)
{
    int g, s;

    cdt->id = 0;
    cdt->thread_id = 0;
    cdt->el = NULL;
    cdt->hz = 200;
    cdt->cronloops = 0;

    cdt->abgs = NULL;
    cdt->scan_group_idx = 0;
    cdt->scan_servers = NULL;
    cdt->scan_finished_count = 0;
    cdt->cursor = 0;
    cdt->check_units = NULL;

    cdt->check_begin_time = 0;
    cdt->scan_keys_count = 0;

    if ((cdt->el = aeCreateEventLoop(200)) == NULL) {
        return VRT_ERROR;
    }

    cdt->scan_servers = darray_create(1,sizeof(abtest_server*));

    if ((cdt->abgs = abtest_groups_create(test_target_groups)) == NULL) {
        return VRT_ERROR;
    }

    /* Init connection context for each server */
    for (g = 0; g < darray_n(cdt->abgs); g ++) {
        abtest_group *group = darray_get(cdt->abgs, g);

        for (s = 0; s < darray_n(&group->abtest_servers); s ++) {
            abtest_server *server = darray_get(&group->abtest_servers, s);
            conn_context *conn;

            /* Exactly one connection is opened per server. */
            server->conn_contexts = darray_create(1, sizeof(conn_context));
            conn = darray_push(server->conn_contexts);
            if (check_conn_context_init(conn,server->host,server->port) != VRT_OK) {
                return VRT_ERROR;
            }

            conn->actx->data = cdt;
            redisAeAttach(cdt->el, conn->actx);
            redisAsyncSetConnectCallback(conn->actx,connect_callback);
            redisAsyncSetDisconnectCallback(conn->actx,disconnect_callback);
        }
    }

    if (aeCreateTimeEvent(cdt->el, 1, check_data_thread_cron, cdt, NULL) == AE_ERR) {
        return VRT_ERROR;
    }

    cdt->check_units = dlistCreate();

    return VRT_OK;
}

/* Release everything owned by a check thread. Members that are still NULL
 * are skipped.
 *
 * The event loop is deleted last. The connections were attached to it with
 * redisAeAttach(); check_conn_context_deinit() presumably frees the hiredis
 * async context (as its dispatch counterpart does), and freeing an attached
 * context makes the ae adapter unregister its file events on the loop, so
 * the loop has to outlive the connections. */
static void check_data_thread_deinit(check_data_thread *cdt)
{
    if (cdt->scan_servers) {
        /* The elements are borrowed pointers into cdt->abgs: only drop them. */
        while (darray_n(cdt->scan_servers) > 0) {
            darray_pop(cdt->scan_servers);
        }
        darray_destroy(cdt->scan_servers);
        cdt->scan_servers = NULL;
    }

    if (cdt->abgs) {
        int i, j;
        /* Deinit connection context for each server */
        for (i = 0; i < darray_n(cdt->abgs); i ++) {
            abtest_group *abg = darray_get(cdt->abgs, i);
            for (j = 0; j < darray_n(&abg->abtest_servers); j ++) {
                abtest_server *abs = darray_get(&abg->abtest_servers, j);
                while (darray_n(abs->conn_contexts) > 0) {
                    conn_context *cc = darray_pop(abs->conn_contexts);
                    check_conn_context_deinit(cc);
                }
            }
        }

        abtest_groups_destroy(cdt->abgs);
        cdt->abgs = NULL;
    }

    if (cdt->check_units) {
        while (dlistLength(cdt->check_units) > 0) {
            check_unit *cu = dlistPop(cdt->check_units);
            check_unit_destroy(cu);
        }
        dlistRelease(cdt->check_units);
        cdt->check_units = NULL;
    }

    if (cdt->el) {
        aeDeleteEventLoop(cdt->el);
        cdt->el = NULL;
    }
}

/* Non-zero while a data check round is in progress; set by
 * begin_check_data() and cleared by end_check_data(). */
static int checking_data;

/* Return 1 if a data check round is currently running, 0 otherwise. */
static int checking_data_or_not(void)
{
    int in_progress;

    update_state_get(checking_data,&in_progress);

    return in_progress ? 1 : 0;
}

static int check_data_threads_count = 8;
static void destroy_check_data_threads(void);
/* return value :
 * -1: error
 * 0 : ok
 * 1 : not need */
static int create_check_data_threads(void)
{
    darray *abgs = NULL;
    abtest_group *abg;
    int groups_count;
    int threads_count_per_group;
    int check_thread_id = 0;
    int i, j, k;
    
    if (cdts != NULL) {
        destroy_check_data_threads();
    }

    cdts = darray_create(2,sizeof(check_data_thread));
    if (cdts == NULL) {
        return -1;
    }

    abgs = abtest_groups_create(dc.test_target_groups);
    if (abgs == NULL) {
        return -1;
    }

    groups_count = darray_n(abgs);
    if (groups_count == 1) {
        abtest_groups_destroy(abgs);
        return 1;
    }

    threads_count_per_group = check_data_threads_count/groups_count;
    if (threads_count_per_group <= 0) {
        threads_count_per_group = 1;
    }
    
    for (i = 0; i < groups_count; i ++) {
        int servers_count, threads_count;
        int servers_count_per_thread;
        int server_idx = 0;

        threads_count = threads_count_per_group;
        abg = darray_get(abgs, i);
        servers_count = darray_n(&abg->abtest_servers);
        servers_count_per_thread = servers_count/threads_count;
        if (servers_count_per_thread == 0) {
            servers_count_per_thread = 1;
            threads_count = servers_count;
        }
        for (j = 0; j < threads_count; j ++) {
            abtest_server *abs;
            
            check_data_thread *cdt = darray_push(cdts);
            check_data_thread_init(cdt,dc.test_target_groups);
            cdt->id = check_thread_id++;
            cdt->scan_group_idx = i;

            abg = darray_get(cdt->abgs, cdt->id);
            
            for (k = 0; k < servers_count_per_thread; k ++) {
                abtest_server **elem = darray_push(cdt->scan_servers);
                abs = darray_get(&abg->abtest_servers, server_idx++);
                abs->data = cdt;
                *elem = abs;
            }

            if (j == threads_count-1) {
                while (server_idx < servers_count) {
                    abtest_server **elem = darray_push(cdt->scan_servers);
                    abs = darray_get(&abg->abtest_servers, server_idx++);
                    abs->data = cdt;
                    *elem = abs;
                }
            }
        }
    }
    
    abtest_groups_destroy(abgs);
    
    return 0;
}

/* Deinitialise every check thread, release the cdts array and reset it to
 * NULL. Does nothing when cdts is already NULL. */
static void destroy_check_data_threads(void)
{
    if (cdts == NULL) {
        return;
    }

    while (darray_n(cdts) > 0) {
        check_data_thread *last = darray_pop(cdts);
        check_data_thread_deinit(last);
    }

    darray_destroy(cdts);
    cdts = NULL;
}

/* Entry point of a check thread: seed rand() from the current time and the
 * thread id, then run the thread's event loop until it is stopped.
 * args is the check_data_thread to run; the result is always NULL. */
static void *check_data_thread_run(void *args)
{
    check_data_thread *self = args;

    srand(vrt_usec_now()^(int)pthread_self());
    aeMain(self->el);

    return NULL;
}

static int start_check_data_threads(void)
{
    int j;
    check_data_thread *cdt;

    if (cdts == NULL) return VRT_ERROR;

    for (j = 0; j < darray_n(cdts); j ++) {
        pthread_attr_t attr;
        
        cdt = darray_get(cdts, j);
        pthread_attr_init(&attr);
        pthread_create(&cdt->thread_id, 
            &attr, check_data_thread_run, cdt);  
    }
    
    return VRT_OK;
}

/* Start a data check round: build the check threads, start them and raise
 * the checking_data flag. The results of the two helper calls are not
 * inspected; the function always returns VRT_OK. */
static int begin_check_data(void)
{
    (void)create_check_data_threads();
    (void)start_check_data_threads();

    update_state_set(checking_data,1);

    return VRT_OK;
}

/* Close a data check round: reset the finished-thread counter and clear the
 * checking_data flag. */
static void end_check_data(void)
{
    update_state_set(check_data_threads_finished_count,0);
    update_state_set(checking_data,0);
}

/* Timer callback of the data checker. It drives the test/check cycle:
 *
 * 1. When the test has been running for longer than test_interval, ask all
 *    test threads to pause.
 * 2. Once every thread has paused (and no check is running), log the
 *    statistics of the finished cycle, reset them and start a check round.
 * 3. Once every check thread has finished, close the check round and let
 *    the test continue.
 *
 * The return value is handed back to the ae timer machinery; presumably it
 * is the delay in milliseconds until the next invocation. */
static int data_checker_cron(aeEventLoop *eventLoop, long long id, void *clientData)
{
    ASSERT(eventLoop == dc.el);

    if (!test_if_need_pause() && vrt_sec_now()-last_test_begin_time > test_interval) {
        test_need_to_pause();
        log_notice("Start pause the test...");
    }

    if (!checking_data_or_not() && test_if_need_pause() &&
        all_threads_paused()) {
        long long tested = get_total_tested_commands_count_per_cycle();
        long long failed = get_total_reply_err_count_per_cycle();
        float failed_percent = 0;

        /* Report 0% instead of dividing by zero when nothing was tested
         * during this cycle. */
        if (tested > 0) {
            failed_percent = (float)failed/(float)tested*100;
        }

        log_notice("Finished pause the test. Tested %lld commands, %lld error reply(%.2f%%).",
            tested, failed, failed_percent);
        reset_total_count_per_cycle();
        sleep(1);
        last_check_begin_time = vrt_sec_now();
        begin_check_data();
        log_notice("Start checking the data...");
    }

    if (checking_data_or_not() && all_check_data_threads_finished()) {
        end_check_data();
        log_notice("Finished checking the data\n");
        test_can_continue();
        last_test_begin_time = vrt_sec_now();
    }

    dc.cronloops ++;
    return 1000/dc.hz;
}

/* Initialise the global data checker (dc).
 *
 * checker            "myself" (case-insensitive) makes this process the
 *                    master checker; any other value is parsed as the
 *                    address of the master, and a connection context for it
 *                    is created.
 * test_target_groups description of the abtest groups; a copy is kept.
 *
 * Returns VRT_OK on success, VRT_ERROR otherwise. On failure whatever was
 * already created stays in dc; vrt_data_checker_deinit() releases it. */
int vrt_data_checker_init(char *checker, char *test_target_groups)
{
    int ret;

    dc.thread_id = 0;
    dc.el = NULL;
    dc.hz = 10;
    dc.cronloops = 0;
    dc.test_target_groups = NULL;
    dc.flags = CHECK_DATA_FLAG_NONE;
    dc.checker = NULL;
    dc.master = NULL;
    dc.check_begin_time = 0;

    dc.el = aeCreateEventLoop(10);
    if (dc.el == NULL) {
        return VRT_ERROR;
    }

    if (aeCreateTimeEvent(dc.el, 1, data_checker_cron, NULL, NULL) == AE_ERR) {
        return VRT_ERROR;
    }

    dc.test_target_groups = sdsnew(test_target_groups);

    dc.checker = sdsnew(checker);

    if (!strcasecmp(checker,"myself")) {
        dc.flags |= CHECK_DATA_FLAG_MASTER;
    } else {
        sds host;
        int port;
        dc.flags |= CHECK_DATA_FLAG_SLAVE;
        host = get_host_port_from_address_string(checker, &port);
        if (host == NULL) {
            return VRT_ERROR;
        }
        dc.master = malloc(sizeof(conn_context));
        if (dc.master == NULL) {
            /* Out of memory: do not hand a NULL context to the init call. */
            sdsfree(host);
            return VRT_ERROR;
        }
        ret = check_conn_context_init(dc.master, host, port);
        sdsfree(host);
        if (ret != VRT_OK) {
            return VRT_ERROR;
        }
    }

    return VRT_OK;
}

/* Release everything held by the global data checker: its event loop, the
 * copied configuration strings, the connection to the master checker (if
 * any) and all check threads. Members that are not set are skipped. */
void vrt_data_checker_deinit(void)
{
    if (dc.el != NULL) {
        aeDeleteEventLoop(dc.el);
        dc.el = NULL;
    }

    if (dc.test_target_groups != NULL) {
        sdsfree(dc.test_target_groups);
        dc.test_target_groups = NULL;
    }

    if (dc.checker != NULL) {
        sdsfree(dc.checker);
        dc.checker = NULL;
    }

    if (dc.master != NULL) {
        check_conn_context_deinit(dc.master);
        free(dc.master);
        dc.master = NULL;
    }

    destroy_check_data_threads();
}

/* Entry point of the data checker thread: seed rand() from the current time
 * and the thread id, then run the checker's event loop. args is unused; the
 * result is always NULL. */
static void *vrt_data_checker_run(void *args)
{
    srand(vrt_usec_now()^(int)pthread_self());
    aeMain(dc.el);
    return NULL;
}

int vrt_start_data_checker(void)
{
    pthread_attr_t attr;
    pthread_attr_init(&attr);
    pthread_create(&dc.thread_id, 
        &attr, vrt_data_checker_run, NULL);   
    return VRT_OK;
}

/* Block until the data checker thread has terminated. The result of the
 * join is not inspected; always returns VRT_OK. */
int vrt_wait_data_checker(void)
{
    (void)pthread_join(dc.thread_id, NULL);

    return VRT_OK;
}

/* Non-zero while the test threads are asked to pause. */
static int test_need_pause = 0;

/* Return 1 if the test threads are currently asked to pause, 0 otherwise. */
int test_if_need_pause(void)
{
    int requested;

    update_state_get(test_need_pause,&requested);

    return requested ? 1 : 0;
}

/* Lift the pause request and reset the paused-thread counters of the
 * produce, dispatch and backend threads. */
void test_can_continue(void)
{
     update_state_set(test_need_pause,0);
     update_state_set(produce_threads_pause_finished_count,0);
     update_state_set(dispatch_threads_pause_finished_count,0);
     update_state_set(backend_threads_pause_finished_count,0);
}

/* Raise the pause request that test_if_need_pause() reports. */
void test_need_to_pause(void)
{
    update_state_set(test_need_pause,1);
}

/* Count one more produce thread as paused. */
void one_produce_thread_paused(void)
{
    update_state_add(produce_threads_pause_finished_count,1);
}

/* Count one more dispatch thread as paused. */
void one_dispatch_thread_paused(void)
{
    update_state_add(dispatch_threads_pause_finished_count,1);
}

/* Count one more backend thread as paused. */
void one_backend_thread_paused(void)
{
    update_state_add(backend_threads_pause_finished_count,1);
}

/* Return 1 when every produce thread has reported that it paused, 0 while
 * some are still running. */
int all_produce_threads_paused(void)
{
    int paused;

    update_state_get(produce_threads_pause_finished_count,&paused);

    return (paused < produce_data_threads_count) ? 0 : 1;
}

/* Return 1 when every dispatch thread has reported that it paused, 0 while
 * some are still running. */
int all_dispatch_threads_paused(void)
{
    int paused;

    update_state_get(dispatch_threads_pause_finished_count,&paused);

    return (paused < dispatch_data_threads_count) ? 0 : 1;
}

/* Return 1 when every backend thread has reported that it paused, 0 while
 * some are still running. */
int all_backend_threads_paused(void)
{
    int paused;

    update_state_get(backend_threads_pause_finished_count,&paused);

    return (paused < backend_threads_count) ? 0 : 1;
}

/* Return 1 when the produce, dispatch and backend threads have all paused,
 * 0 otherwise. The three groups are examined in that order and the check
 * stops at the first group that is still running. */
int all_threads_paused(void)
{
    return all_produce_threads_paused() &&
        all_dispatch_threads_paused() &&
        all_backend_threads_paused();
}


================================================
FILE: tests/vrt_check_data.h
================================================
#ifndef _VRT_CHECK_DATA_H_
#define _VRT_CHECK_DATA_H_

/* Set up / tear down the global data checker. checker is either "myself"
 * or the address of the master checker; both functions are defined in
 * vrt_check_data.c. init returns VRT_OK or VRT_ERROR. */
int vrt_data_checker_init(char *checker, char *test_target_groups);
void vrt_data_checker_deinit(void);

/* Start the data checker thread / wait for it to terminate. */
int vrt_start_data_checker(void);
int vrt_wait_data_checker(void);

/* Pause request shared by all test threads: query it (1 = pause requested),
 * clear it (also resets the paused-thread counters), or raise it. */
int test_if_need_pause(void);
void test_can_continue(void);
void test_need_to_pause(void);

/* Called by a thread of the given kind to report that it has paused. */
void one_produce_thread_paused(void);
void one_dispatch_thread_paused(void);
void one_backend_thread_paused(void);

/* Return 1 when every thread of the given kind (or of all three kinds) has
 * reported that it paused, 0 otherwise. */
int all_produce_threads_paused(void);
int all_dispatch_threads_paused(void);
int all_backend_threads_paused(void);
int all_threads_paused(void);

#endif


================================================
FILE: tests/vrt_dispatch_data.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <getopt.h>
#include <fcntl.h>
#include <errno.h>
#include <signal.h>
#include <sys/stat.h>
#include <sys/utsname.h>

#include <hiredis.h>
#include <async.h>
#include <adapters/ae.h>

#include <dhashkit.h>
#include <dlist.h>
#include <dmtqueue.h>
#include <dlog.h>

#include <vrt_util.h>
#include <vrt_public.h>
#include <vrabtest.h>
#include <vrt_dispatch_data.h>
#include <vrt_produce_data.h>

/* Number of dispatch threads; set by vrt_dispatch_data_init(). */
int dispatch_data_threads_count;
/* The dispatch threads themselves (elements are dispatch_data_thread). */
static darray *dispatch_data_threads = NULL;

/* Number of dispatch threads that have reported a pause. */
int dispatch_threads_pause_finished_count;

/* Statistics accumulated by the dispatch threads when they pause; the
 * "per cycle" pair is cleared by reset_total_count_per_cycle(). */
static long long total_tested_commands_count_per_cycle = 0;
static long long total_reply_err_count_per_cycle = 0;
static long long total_tested_commands_count = 0;
static long long total_reply_err_count = 0;

/* Return the number of commands tested during the current cycle, as
 * accumulated by the dispatch threads. */
long long get_total_tested_commands_count_per_cycle(void)
{
    long long snapshot;

    update_state_get(total_tested_commands_count_per_cycle,&snapshot);

    return snapshot;
}

/* Return the number of error replies counted during the current cycle, as
 * accumulated by the dispatch threads. */
long long get_total_reply_err_count_per_cycle(void)
{
    long long snapshot;

    update_state_get(total_reply_err_count_per_cycle,&snapshot);

    return snapshot;
}

/* Clear both per-cycle counters (tested commands and error replies). */
void reset_total_count_per_cycle(void)
{
    update_state_set(total_tested_commands_count_per_cycle,0);
    update_state_set(total_reply_err_count_per_cycle,0);
}

/* Collects the replies of every abtest group to one dispatched command. */
typedef struct reply_unit {
    int total_count;        /* Number of replies expected (one per group) */
    int received_count;     /* Number of replies received so far */
    redisReply **replys;    /* total_count slots, indexed by group; a slot is
                             * NULL when the callback got no reply */
    data_unit *du;          /* The command these replies belong to */
} reply_unit;

/* Log an error describing two replies to the same command that differ.
 *
 * For both replies the type is logged, plus the status string, error string,
 * integer value and array length when the reply is of the matching type
 * ("NULL" or 0 otherwise). When the command has at least one key, the first
 * key is hex-dumped along with the message.
 *
 * Both replies are dereferenced unconditionally and must not be NULL. */
static void show_replys_inconsistency_msg(data_unit *du, redisReply *reply1, redisReply *reply2)
{
    int *keyindex, numkeys;
    sds key = NULL;

    keyindex = get_keys_from_data_producer(du->dp, du->argv, du->argc, &numkeys);
    if (numkeys > 0) {
        key = du->argv[keyindex[0]];
    }
    free(keyindex);

    if (key) {
        log_hexdump(LOG_ERR,key,sdslen(key),
            "%s command replys are inconsistency, "
            "reply type: %d %d, "
            "reply status: %s %s, "
            "reply error: %s %s, "
            "reply integer: %lld %lld, "
            "reply array len: %zu %zu, "
            "key(len:%zu): ", 
            du->dp->name, 
            reply1->type, reply2->type, 
            reply1->type==REDIS_REPLY_STATUS?reply1->str:"NULL",
            reply2->type==REDIS_REPLY_STATUS?reply2->str:"NULL",
            reply1->type==REDIS_REPLY_ERROR?reply1->str:"NULL",
            reply2->type==REDIS_REPLY_ERROR?reply2->str:"NULL",
            reply1->type==REDIS_REPLY_INTEGER?reply1->integer:0,
            reply2->type==REDIS_REPLY_INTEGER?reply2->integer:0,
            reply1->type==REDIS_REPLY_ARRAY?reply1->elements:0,
            reply2->type==REDIS_REPLY_ARRAY?reply2->elements:0,
            sdslen(key));
    } else {
        /* Command without a key: same message, without the hex dump. */
        log_error("%s command replys are inconsistency, "
            "reply type: %d %d, "
            "reply status: %s %s, "
            "reply error: %s %s, "
            "reply integer: %lld %lld, "
            "reply array len: %zu %zu",
            du->dp->name,
            reply1->type, reply2->type, 
            reply1->type==REDIS_REPLY_STATUS?reply1->str:"NULL",
            reply2->type==REDIS_REPLY_STATUS?reply2->str:"NULL",
            reply1->type==REDIS_REPLY_ERROR?reply1->str:"NULL",
            reply2->type==REDIS_REPLY_ERROR?reply2->str:"NULL",
            reply1->type==REDIS_REPLY_INTEGER?reply1->integer:0,
            reply2->type==REDIS_REPLY_INTEGER?reply2->integer:0,
            reply1->type==REDIS_REPLY_ARRAY?reply1->elements:0,
            reply2->type==REDIS_REPLY_ARRAY?reply2->elements:0);
    }

}

/* Bring the array replies of commands whose element order is not defined
 * into a canonical order, so that replies from different servers can be
 * compared element by element.
 *
 * - smembers, sunion, sdiff, sinter, hkeys, hvals: elements are sorted one
 *   by one (step 1).
 * - hgetall: elements are sorted in groups of two, compared on the element
 *   at offset 0 of each group (step 2).
 *
 * Slots that hold no reply (NULL, stored by reply_callback() when hiredis
 * delivered no reply) and non-array replies are left untouched.
 *
 * Always returns VRT_OK. */
static int sort_replys_if_needed(reply_unit *ru)
{
    data_unit *du = ru->du;
    data_producer *dp = du->dp;
    int step = 0, idx_cmp = 0;

    if (dp->cmd_type&TEST_CMD_TYPE_SET) {
        if (!strcmp(dp->name,"smembers") ||
            !strcmp(dp->name,"sunion") ||
            !strcmp(dp->name,"sdiff") ||
            !strcmp(dp->name,"sinter")) {
            step = 1;
        }
    } else if (dp->cmd_type&TEST_CMD_TYPE_HASH) {
        if (!strcmp(dp->name,"hkeys") ||
            !strcmp(dp->name,"hvals")) {
            step = 1;
        } else if (!strcmp(dp->name,"hgetall")) {
            step = 2;
            idx_cmp = 0;
        }
    }

    if (step > 0) {
        int i;
        redisReply *reply;
        for (i = 0; i < ru->received_count; i ++) {
            reply = ru->replys[i];
            /* A missing reply must not be dereferenced. */
            if (reply == NULL || reply->type != REDIS_REPLY_ARRAY)
                continue;
            sort_array_by_step(reply->element, reply->elements,
                step, idx_cmp, reply_string_binary_compare);
        }
    }

    return VRT_OK;
}

/* Compare the reply of the first group with the reply of every other group.
 *
 * Returns 1 when all replies agree and 0 at the first difference, which is
 * logged. A missing reply (NULL slot) only agrees with another missing
 * reply; it is never handed to the comparison or reporting helpers, which
 * dereference their arguments. */
static int check_replys_if_same(reply_unit *ru)
{
    int j;
    redisReply **replys = ru->replys;
    redisReply *replyb, *reply;

    sort_replys_if_needed(ru);

    replyb = replys[0];

    for (j = 1; j < ru->total_count ; j ++) {
        reply = replys[j];

        if (replyb == NULL || reply == NULL) {
            if (replyb == reply) {
                continue;
            }
            log_error("%s command replys are inconsistency, "
                "some servers returned no reply",
                ru->du->dp->name);
            return 0;
        }

        /* check_two_replys_if_same() returns non-zero when the replies
         * differ. */
        if (check_two_replys_if_same(replyb, reply)) {
            show_replys_inconsistency_msg(ru->du, replyb, reply);
            return 0;
        }
    }

    return 1;
}

/* Private data attached to one command sent to one group; allocated in
 * dispatch_thread_send_data() and freed by reply_callback(). */
struct callback_data {
    dispatch_data_thread *ddt;  /* Dispatch thread that sent the command */
    reply_unit *ru;             /* Where the reply has to be stored */
    int idx;                    /* Slot in ru->replys (index of the group) */
};

/* hiredis callback for one command sent to one group.
 *
 * The reply (or NULL when there is none) is stored in the slot of the reply
 * unit that belongs to this group, and the callback data is freed. When the
 * last outstanding reply has arrived, the replies are compared; if they
 * agree and this last reply exists, error replies are counted and the key is
 * cached when the command's producer asks for it. Finally the reply unit and
 * its replies are released and the thread's counters are updated. */
static void reply_callback(redisAsyncContext *c, void *r, void *privdata) {
    struct callback_data *cbd = privdata;
    dispatch_data_thread *ddt = cbd->ddt;
    reply_unit *ru = cbd->ru;
    redisReply *reply = NULL;
    int same, slot;

    if (r != NULL) {
        /* Beacause reply will be freed by hiredis in async way. */
        reply = steal_hiredis_redisreply(r);
    }

    ru->replys[cbd->idx] = reply;
    ru->received_count ++;
    free(cbd);

    /* Still waiting for other groups. */
    if (ru->received_count < ru->total_count) {
        return;
    }

    same = check_replys_if_same(ru);
    if (same == 1 && reply != NULL) {
        data_unit *du = ru->du;
        data_producer *dp = du->dp;

        if (reply->type == REDIS_REPLY_ERROR) {
            ddt->reply_type_err_count_per_cycle++;
        }

        /* Cache this key if needed. */
        if (dp->need_cache_key_proc != NULL &&
            dp->need_cache_key_proc(reply)) {
            produce_scheme *ps = du->data;
            key_cache_array *kcp = kcp_get_from_ps(ps, dp);
            sds key = get_one_key_from_data_unit(du);
            key_cache_array_input(kcp,key,sdslen(key));
        }
    }

    /* release the reply_unit */
    for (slot = 0; slot < ru->total_count; slot ++) {
        freeReplyObject(ru->replys[slot]);
        ru->replys[slot] = NULL;
    }
    free(ru->replys);
    data_unit_put(ru->du);
    free(ru);

    ddt->count_wait_for_reply --;
    ASSERT(ddt->count_wait_for_reply >= 0);

    ddt->reply_total_count_per_cycle++;
}

/* Take queued data units and send each of them to one server of every
 * abtest group.
 *
 * For each unit a reply_unit with one slot per group is allocated. The
 * target server of a group is chosen by the group's get_backend_server()
 * hook from the first key of the command, or at random when the command has
 * no key; the connection is selected by the unit's hash value. Replies are
 * handled by reply_callback().
 *
 * The key positions depend only on the data unit, so they are computed once
 * per unit rather than once per group.
 *
 * The loop ends when the queue is empty or after a bounded number of units.
 * Always returns VRT_OK.
 *
 * NOTE(review): the results of malloc() and redisAsyncCommandArgv() are not
 * checked here. */
static int dispatch_thread_send_data(dispatch_data_thread *ddt)
{
    int count_per_time = 1000;
    data_unit *du;

    while ((du = dmtqueue_pop(ddt->datas)) != NULL) {
        redisAsyncContext *actx;
        int j;
        int *keyindex, numkeys;
        sds key = NULL;

        size_t *argvlen = malloc(du->argc*sizeof(size_t));
        reply_unit *ru = malloc(sizeof(reply_unit));
        ru->du = du;
        ru->total_count = darray_n(ddt->abgs);
        ru->received_count = 0;
        ru->replys = malloc(ru->total_count*sizeof(redisReply *));
        for (j = 0; j < du->argc; j ++) {
            argvlen[j] = sdslen(du->argv[j]);
        }

        keyindex = get_keys_from_data_producer(du->dp, du->argv, du->argc, &numkeys);
        if (numkeys != 0) {
            key = du->argv[keyindex[0]];
        }
        free(keyindex);

        for (j = 0; j < darray_n(ddt->abgs); j ++) {
            struct callback_data *cbd;
            abtest_server *abs;
            abtest_group *abg = darray_get(ddt->abgs, j);
            conn_context *cc;

            cbd = malloc(sizeof(struct callback_data));
            cbd->ddt = ddt;
            cbd->ru = ru;
            cbd->idx = j;

            if (numkeys == 0) {
                unsigned int idx;
                idx = (unsigned int)rand()%darray_n(&abg->abtest_servers);
                abs = darray_get(&abg->abtest_servers,idx);
            } else {
                abs = abg->get_backend_server(abg,key,sdslen(key));
            }

            cc = darray_get(abs->conn_contexts,
                du->hashvalue%darray_n(abs->conn_contexts));
            actx = cc->actx;
            redisAsyncCommandArgv(actx, reply_callback, cbd, du->argc, du->argv, argvlen);
        }
        free(argvlen);

        ddt->count_wait_for_reply ++;

        if (count_per_time-- <= 0) break;
    }

    return VRT_OK;
}

/* Timer callback of a dispatch thread.
 *
 * While the thread is paused it only checks whether the pause request was
 * lifted. Otherwise queued data is sent as long as fewer than 4000 units
 * are waiting for replies. When a pause is requested, the produce and
 * backend threads have paused and this thread has nothing left to send, the
 * thread marks itself paused, adds its per-cycle statistics to the global
 * counters and reports the pause.
 *
 * The return value is handed back to the ae timer machinery; presumably it
 * is the delay in milliseconds until the next invocation. */
static int dispatch_data_thread_cron(aeEventLoop *eventLoop, long long id, void *clientData)
{
    dispatch_data_thread *ddt = clientData;
    int drained;

    ASSERT(eventLoop == ddt->el);

    /* At the begin of this loop */
    if (ddt->pause) {
        if (test_if_need_pause()) {
            /* Still paused: look again in a second. */
            ddt->cronloops ++;
            return 1000;
        }
        ddt->pause = 0;
    }

    if (ddt->count_wait_for_reply < 4000 &&
        !dmtqueue_empty(ddt->datas)) {
        dispatch_thread_send_data(ddt);
    }

    /* At the end of this loop */
    drained = test_if_need_pause() &&
        all_produce_threads_paused() &&
        all_backend_threads_paused() &&
        dmtqueue_empty(ddt->datas) &&
        dlistLength(ddt->rdatas) == 0;

    if (drained) {
        ddt->pause = 1;

        /* Update the dispatch state */
        update_state_add(total_tested_commands_count_per_cycle,
            ddt->reply_total_count_per_cycle);
        update_state_add(total_tested_commands_count,
            ddt->reply_total_count_per_cycle);
        ddt->reply_total_count_per_cycle = 0;

        update_state_add(total_reply_err_count_per_cycle,
            ddt->reply_type_err_count_per_cycle);
        update_state_add(total_reply_err_count,
            ddt->reply_type_err_count_per_cycle);
        ddt->reply_type_err_count_per_cycle = 0;

        one_dispatch_thread_paused();
    }

    ddt->cronloops ++;
    return 1000/ddt->hz;
}

/* hiredis connect callback: log the context's error string when the
 * connection attempt did not succeed; a successful connect is silent. */
static void connect_callback(const redisAsyncContext *c, int status) {
    if (status == REDIS_OK) {
        return;
    }

    log_error("Error: %s\n", c->errstr);
}

/* hiredis disconnect callback: log the context's error string when the
 * disconnect was caused by an error; a clean disconnect is silent. */
static void disconnect_callback(const redisAsyncContext *c, int status) {
    if (status == REDIS_OK) {
        return;
    }

    log_error("Error: %s\n", c->errstr);
}

/* Open an asynchronous hiredis connection to host:port and store it in cc;
 * the synchronous context of cc is left unset.
 *
 * Returns VRT_ERROR when no async context could be allocated, VRT_OK
 * otherwise. The error state of a returned context is not examined here. */
static int dispatch_conn_context_init(conn_context *cc, char *host, int port)
{
    cc->ctx = NULL;
    cc->actx = redisAsyncConnect(host, port);

    return (cc->actx == NULL) ? VRT_ERROR : VRT_OK;
}

/* Free the synchronous and asynchronous hiredis contexts held by cc, if
 * any, and reset the pointers so that a second call is harmless.
 *
 * The pointers are now really reset: the former "cc->ctx == NULL;" was a
 * comparison without effect, which left dangling pointers behind. */
static void dispatch_conn_context_deinit(conn_context *cc)
{
    if (cc->ctx) {
        redisFree(cc->ctx);
        cc->ctx = NULL;
    }

    if (cc->actx) {
        redisAsyncFree(cc->actx);
        cc->actx = NULL;
    }
}

/* Prepare one dispatch thread.
 *
 * All fields are reset, then the event loop, the input queue, the list of
 * pending reply units, the private copy of the abtest groups (parsed from
 * test_target_groups), `connections` async connections per server attached
 * to the thread's event loop, and the cron timer are created.
 *
 * Returns VRT_OK on success and VRT_ERROR as soon as one step fails; what
 * was created so far is left in place. */
static int dispatch_data_thread_init(dispatch_data_thread *ddt, char *test_target_groups, int connections)
{
    int g, s, n;

    ddt->id = 0;
    ddt->thread_id = 0;
    ddt->el = NULL;
    ddt->hz = 10;
    ddt->cronloops = 0;
    ddt->datas = NULL;
    ddt->rdatas = NULL;
    ddt->abgs = NULL;
    ddt->pause = 0;
    ddt->count_wait_for_reply = 0;
    ddt->reply_total_count_per_cycle = 0;
    ddt->reply_type_err_count_per_cycle = 0;

    if ((ddt->el = aeCreateEventLoop(200)) == NULL) {
        return VRT_ERROR;
    }

    if ((ddt->datas = dmtqueue_create()) == NULL) {
        return VRT_ERROR;
    }

    if (dmtqueue_init_with_lockqueue(ddt->datas, NULL) != 0) {
        return VRT_ERROR;
    }

    if ((ddt->rdatas = dlistCreate()) == NULL) {
        return VRT_ERROR;
    }

    if ((ddt->abgs = abtest_groups_create(test_target_groups)) == NULL) {
        return VRT_ERROR;
    }

    /* Init connection context for each server */
    for (g = 0; g < darray_n(ddt->abgs); g ++) {
        abtest_group *group = darray_get(ddt->abgs, g);

        for (s = 0; s < darray_n(&group->abtest_servers); s ++) {
            abtest_server *server = darray_get(&group->abtest_servers, s);

            server->conn_contexts = darray_create(connections, sizeof(conn_context));
            for (n = 0; n < connections; n ++) {
                conn_context *conn = darray_push(server->conn_contexts);

                if (dispatch_conn_context_init(conn,server->host,server->port) != VRT_OK) {
                    return VRT_ERROR;
                }

                conn->actx->data = ddt;
                redisAeAttach(ddt->el, conn->actx);
                redisAsyncSetConnectCallback(conn->actx,connect_callback);
                redisAsyncSetDisconnectCallback(conn->actx,disconnect_callback);
            }
        }
    }

    if (aeCreateTimeEvent(ddt->el, 1, dispatch_data_thread_cron, ddt, NULL) == AE_ERR) {
        return VRT_ERROR;
    }

    return VRT_OK;
}

/* Release everything owned by a dispatch thread. Members that are still
 * NULL are skipped.
 *
 * The event loop is deleted last: the async contexts were attached to it
 * with redisAeAttach(), and redisAsyncFree() (called through
 * dispatch_conn_context_deinit()) makes the ae adapter unregister its file
 * events on that loop, so the loop has to outlive the connections.
 *
 * The rdatas list created by dispatch_data_thread_init() is released here
 * as well; it used to be leaked. */
static void dispatch_data_thread_deinit(dispatch_data_thread *ddt)
{
    if (ddt->datas) {
        dmtqueue_destroy(ddt->datas);
        ddt->datas = NULL;
    }

    if (ddt->abgs) {
        int i, j;
        /* Deinit connection context for each server */
        for (i = 0; i < darray_n(ddt->abgs); i ++) {
            abtest_group *abg = darray_get(ddt->abgs, i);
            for (j = 0; j < darray_n(&abg->abtest_servers); j ++) {
                abtest_server *abs = darray_get(&abg->abtest_servers, j);
                while (darray_n(abs->conn_contexts) > 0) {
                    conn_context *cc = darray_pop(abs->conn_contexts);
                    dispatch_conn_context_deinit(cc);
                }
            }
        }

        abtest_groups_destroy(ddt->abgs);
        ddt->abgs = NULL;
    }

    if (ddt->rdatas) {
        dlistRelease(ddt->rdatas);
        ddt->rdatas = NULL;
    }

    if (ddt->el) {
        aeDeleteEventLoop(ddt->el);
        ddt->el = NULL;
    }
}

/* Create and initialise threads_count dispatch threads, each with its own
 * copy of the abtest groups and `connections` connections per server. The
 * threads get consecutive ids starting at 0.
 *
 * Returns VRT_OK on success, VRT_ERROR when the thread array or one of the
 * threads could not be set up. */
int vrt_dispatch_data_init(int threads_count, char *test_target_groups, int connections)
{
    int idx = 0;

    dispatch_data_threads_count = threads_count;
    dispatch_data_threads = darray_create(threads_count, sizeof(dispatch_data_thread));
    if (dispatch_data_threads == NULL) {
        return VRT_ERROR;
    }

    while (idx < threads_count) {
        dispatch_data_thread *ddt = darray_push(dispatch_data_threads);

        if (dispatch_data_thread_init(ddt, test_target_groups, connections) != VRT_OK) {
            return VRT_ERROR;
        }
        ddt->id = idx;
        idx ++;
    }

    return VRT_OK;
}

/* Deinitialise every dispatch thread, release the thread array and reset it
 * to NULL. Does nothing when the array does not exist. */
void vrt_dispatch_data_deinit(void)
{
    if (dispatch_data_threads == NULL) {
        return;
    }

    while (darray_n(dispatch_data_threads) > 0) {
        dispatch_data_thread *last = darray_pop(dispatch_data_threads);
        dispatch_data_thread_deinit(last);
    }

    darray_destroy(dispatch_data_threads);
    dispatch_data_threads = NULL;
}

/* Entry point of a dispatch thread: seed rand() from the current time and
 * the thread id, then run the thread's event loop. args is the
 * dispatch_data_thread to run; the result is always NULL. */
static void *vrt_dispatch_data_thread_run(void *args)
{
    dispatch_data_thread *self = args;

    srand(vrt_usec_now()^(int)pthread_self());
    aeMain(self->el);

    return NULL;
}

int vrt_start_dispatch_data(void)
{
    unsigned int i;
    for (i = 0; i < darray_n(dispatch_data_threads); i ++) {
        pthread_attr_t attr;
        dispatch_data_thread *ddt;
        pthread_attr_init(&attr);
        ddt = darray_get(dispatch_data_threads, i);
        pthread_create(&ddt->thread_id, 
            &attr, vrt_dispatch_data_thread_run, ddt);
    }
    
    return VRT_OK;
}

/* Join every thread recorded in the global dispatch thread table, in
 * table order. Always returns VRT_OK. */
int vrt_wait_dispatch_data(void)
{
    unsigned int idx = 0;

    /* Block until each dispatch thread has finished. */
    while (idx < darray_n(dispatch_data_threads)) {
        dispatch_data_thread *worker = darray_get(dispatch_data_threads, idx);
        pthread_join(worker->thread_id, NULL);
        idx ++;
    }

    return VRT_OK;
}

/* Hand a data unit over to one of the dispatch threads.
 *
 * The target thread is chosen from du->hashvalue, which is the CRC32a
 * hash of the first key of the command, or a random number when the
 * command carries no key.
 *
 * Return value:
 *   1: the caller should sleep a while, the target queue holds more
 *      than 2000 entries
 *   0: the caller can continue normally
 *  -1: the push into the target queue failed */
int data_dispatch(data_unit *du)
{
    int numkeys;
    int *keyindex = get_keys_from_data_producer(du->dp, du->argv, du->argc, &numkeys);
    int slot;
    dispatch_data_thread *target;
    long long queued;

    if (numkeys != 0) {
        sds first_key = du->argv[keyindex[0]];
        du->hashvalue = (unsigned int)hash_crc32a(first_key, sdslen(first_key));
    } else {
        du->hashvalue = (unsigned int)rand();
    }
    free(keyindex);

    slot = du->hashvalue%dispatch_data_threads_count;
    target = darray_get(dispatch_data_threads, slot);

    queued = dmtqueue_push(target->datas, du);
    if (queued <= 0) {
        test_log_error("Data unit push to dispatch thread %d failed", target->id);
        return -1;
    }

    return (queued > 2000) ? 1 : 0;
}


================================================
FILE: tests/vrt_dispatch_data.h
================================================
#ifndef _VRT_DISPATCH_DATA_H_
#define _VRT_DISPATCH_DATA_H_

#include <darray.h>

struct abtest_group;
struct dlist;
struct dmtqueue;
struct data_unit;
struct aeEventLoop;

/* Per-thread state of one data dispatch thread. */
typedef struct dispatch_data_thread {
    int id;                 /* Index of this entry in the dispatch thread table. */
    pthread_t thread_id;    /* Filled in by pthread_create() when the thread is started. */
    
    struct aeEventLoop *el; /* Event loop run by the thread (passed to aeMain()). */
    int hz;                 /* NOTE(review): presumably the cron frequency - confirm. */
    int cronloops;          /* Number of times the cron function has run. */

    struct dmtqueue *datas;  /* Queue of data_unit values: receives data from the
                                        produce data thread; the data is then sent to the abtest groups. */
    struct dlist *rdatas;   /* List of reply_unit values: caches data whose replies
                                        have not yet been completely received from the abtest groups. */

    darray *abgs; /* Array of abtest_group. */

    int pause;              /* NOTE(review): looks like a pause request/state flag - confirm. */

    int count_wait_for_reply; /* NOTE(review): presumably the number of requests still awaiting a reply - confirm. */

    /* Per-cycle counters. NOTE(review): presumably total replies and
     * replies flagged as type errors within the current cycle - confirm. */
    long long reply_total_count_per_cycle;
    long long reply_type_err_count_per_cycle;
} dispatch_data_thread;

/* Number of dispatch threads; set by vrt_dispatch_data_init(). */
extern int dispatch_data_threads_count;

/* NOTE(review): presumably counts dispatch threads that have completed a
 * pause request - confirm against the definition. */
extern int dispatch_threads_pause_finished_count;

/* Per-cycle statistics accessors. NOTE(review): names suggest they
 * aggregate/reset the per-thread *_per_cycle counters - confirm. */
long long get_total_tested_commands_count_per_cycle(void);
long long get_total_reply_err_count_per_cycle(void);
void reset_total_count_per_cycle(void);

/* Create / destroy the global table of dispatch threads. */
int vrt_dispatch_data_init(int threads_count, char *test_target_groups, int connections);
void vrt_dispatch_data_deinit(void);

/* Start all dispatch threads / join all dispatch threads. */
int vrt_start_dispatch_data(void);
int vrt_wait_dispatch_data(void);

/* Queue a data unit on a dispatch thread.
 * Returns 1 (caller should back off), 0 (continue) or -1 (error). */
int data_dispatch(struct data_unit *du);

#endif


================================================
FILE: tests/vrt_produce_data.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <getopt.h>
#include <fcntl.h>
#include <errno.h>
#include <signal.h>
#include <assert.h>
#include <math.h>
#include <sys/stat.h>
#include <sys/utsname.h>

#include <dspecialconfig.h>

#include <hiredis.h>
#include <darray.h>
#include <dutil.h>
#include <dlog.h>

#include <vrt_util.h>
#include <vrt_public.h>
#include <vrabtest.h>
#include <vrt_produce_data.h>

#define PRODUCE_KEY_CACHE_POOL_COUNT 5

/* Per-thread state of one data produce thread. */
typedef struct produce_thread {
    int id;                 /* NOTE(review): presumably the index of this thread - confirm. */
    pthread_t thread_id;    /* POSIX thread handle. */

    produce_scheme *ps;     /* Produce scheme used by this thread. */

    int pause;              /* NOTE(review): looks like a pause request/state flag - confirm. */
    long long looptimes;    /* NOTE(review): presumably a loop iteration counter - confirm. */
} produce_thread;

/* NOTE(review): presumably the producer used to issue key deletions - confirm. */
data_producer *delete_data_producer = NULL;

/* Bounds used by the random generators below.
 * get_random_key() draws a length of
 * key_length_min + rand % key_length_range_gap (or exactly key_length_min
 * when the gap is 0). */
static unsigned int key_length_min;
static unsigned int key_length_max;
static unsigned int key_length_range_gap;
static unsigned int field_length_max;   /* Modulus in get_random_field_len(). */
static unsigned int string_length_max;  /* Modulus in get_random_string(). */

static int cmd_type;

static int key_cache_pools_count = 0;

static darray needed_cmd_type_producer;  /* Element type: data_producer. */
static unsigned int needed_cmd_type_producer_count;

int produce_data_threads_count;
static darray produce_threads;

int produce_threads_pause_finished_count;

static int non_empty_kcps_count = 0;
/* NOTE(review): "{-1}" only sets element 0 to (unsigned)-1; the remaining
 * elements are zero-initialized. Confirm whether all slots were meant to
 * start at -1. */
unsigned int non_empty_kcps_idx[PRODUCE_KEY_CACHE_POOL_COUNT] = {-1};

/* Pick a random key from the key cache that the scheme ps associates
 * with producer dp. The result is whatever key_cache_array_random()
 * yields for that cache. */
static sds get_random_cached_key(produce_scheme *ps, data_producer *dp)
{
    return key_cache_array_random(kcp_get_from_ps(ps,dp));
}

/* Return a random int whose sign is chosen by one rand() call and whose
 * magnitude comes from a second rand() call. */
static int get_random_int(void)
{
    int negative = (rand()%2 == 1);
    int magnitude = (int)rand();

    return negative ? 0 - magnitude : magnitude;
}

/* Return the next rand() value converted to unsigned int. */
static unsigned int get_random_unsigned_int(void)
{
    int raw = rand();

    return (unsigned int)raw;
}

/* Return a random byte whose value, viewed as unsigned char, lies in
 * 5..254.
 *
 * The reduction is done on the int returned by rand() before narrowing
 * to char. The previous form, (char)rand()%250 + 5, cast first, so the
 * modulus operated on a truncated (possibly negative) char and the result
 * could be any byte, including '\0'. */
static char get_random_char(void)
{
    return (char)(rand()%250 + 5);
}

/* Build a new sds key filled with random characters.
 * The length is key_length_min when key_length_range_gap is 0, otherwise
 * key_length_min plus a random offset below the gap; a computed length
 * of 0 is bumped to 1. */
static sds get_random_key(void)
{
    sds key = sdsempty();
    unsigned int pos, keylen;

    if (key_length_range_gap == 0) {
        keylen = key_length_min;
    } else {
        keylen = get_random_unsigned_int()%key_length_range_gap+key_length_min;
    }
    if (keylen == 0) {
        keylen = 1;
    }

    /* Reserve the space, then declare it used before filling it in. */
    key = sdsMakeRoomFor(key,(size_t)keylen);
    sdsIncrLen(key, (int)keylen);

    for (pos = 0; pos < keylen; pos ++) {
        key[pos] = (char)get_random_char();
    }

    return key;
}

/* Build a new sds string of random characters whose length is a random
 * value below string_length_max (so it may be empty). */
static sds get_random_string(void)
{
    sds text = sdsempty();
    unsigned int filled = 0;
    unsigned int total = get_random_unsigned_int()%string_length_max;

    /* Reserve the space, then declare it used before filling it in. */
    text = sdsMakeRoomFor(text,(size_t)total);
    sdsIncrLen(text, (int)total);

    while (filled < total) {
        text[filled] = get_random_char();
        filled ++;
    }

    return text;
}

/* Build a new sds holding a random decimal number in text form.
 * One coin flip decides whether it starts with "-", a second one whether
 * it has a fractional part ("%u.%u") or is a plain integer ("%u"). */
static sds get_random_float_str(void)
{
    sds num = (rand()%2 == 1) ? sdsnew("-") : sdsempty();

    if (rand()%2 != 1) {
        return sdscatfmt(num,"%u",
            get_random_unsigned_int());
    }

    return sdscatfmt(num,"%u.%u",
        get_random_unsigned_int(),
        get_random_unsigned_int());
}

#define ZSET_RANGE_MIN_MAX_TYPE_RANK    0
#define ZSET_RANGE_MIN_MAX_TYPE_SCORE   1
#define ZSET_RANGE_MIN_MAX_TYPE_LEX     2
/* Build a random (min, max) pair of range arguments in text form.
 *
 * range_type selects the syntax:
 *   ZSET_RANGE_MIN_MAX_TYPE_RANK:  two plain integers.
 *   ZSET_RANGE_MIN_MAX_TYPE_SCORE: each bound is "-inf"/"+inf", an
 *                                  exclusive "(<number>" or a plain number.
 *   ZSET_RANGE_MIN_MAX_TYPE_LEX:   each bound is "-"/"+", an exclusive
 *                                  "(<string>" or an inclusive "[<string>".
 *
 * In roughly 95% of the calls the two random values are ordered so that
 * min <= max; in the remaining 5% they are deliberately reversed.
 *
 * Returns a malloc'ed array of two sds values (range[0] is the min,
 * range[1] is the max), or NULL if the type is unknown, a generated score
 * cannot be parsed, or the array cannot be allocated.
 * NOTE(review): presumably the caller frees both strings and the array -
 * confirm against the callers. */
static sds *get_random_zset_range_min_max_str(int range_type)
{
    sds *range; /* range[0] is the min, range[1] is the max */
    unsigned int probability = rand()%100;

    range = malloc(2*sizeof(sds));
    if (range == NULL) {
        return NULL;
    }

    if (range_type == ZSET_RANGE_MIN_MAX_TYPE_RANK) {
        unsigned int min = get_random_unsigned_int();
        unsigned int max = get_random_unsigned_int();

        if ((probability >= 95 && min <= max) ||
            (probability < 95 && min > max)) {
            range[0] = sdsfromlonglong((long long)max);
            range[1] = sdsfromlonglong((long long)min);
        } else {
            range[0] = sdsfromlonglong((long long)min);
            range[1] = sdsfromlonglong((long long)max);
        }
    } else if (range_type == ZSET_RANGE_MIN_MAX_TYPE_SCORE) {
        sds min_str = get_random_float_str();
        sds max_str = get_random_float_str();
        /* double, not float: strtod() returns double and the generated
         * numbers carry more digits than a float can distinguish. */
        double min, max;
        char *eptr;
        sds swap;
        unsigned int min_probability = rand()%3;
        unsigned int max_probability = rand()%3;

        min = strtod(min_str,&eptr);
        if (eptr[0] != '\0' || isnan(min)) {
            sdsfree(min_str);
            sdsfree(max_str);
            free(range);
            return NULL;
        }
        max = strtod(max_str,&eptr);
        if (eptr[0] != '\0' || isnan(max)) {
            sdsfree(min_str);
            sdsfree(max_str);
            free(range);
            return NULL;
        }
        if ((probability >= 95 && min <= max) ||
            (probability < 95 && min > max)) {
            swap = min_str;
            min_str = max_str;
            max_str = swap;
        }

        if (min_probability == 0) {
            range[0] = sdsnew("-inf");
            sdsfree(min_str);   /* not used for an open lower bound */
        } else if (min_probability == 1) {
            range[0] = sdsnew("(");
            range[0] = sdscatfmt(range[0],"%S",min_str);
            sdsfree(min_str);
        } else {
            range[0] = min_str; /* ownership moves into the result */
        }
        if (max_probability == 0) {
            range[1] = sdsnew("+inf");
            sdsfree(max_str);   /* not used for an open upper bound */
        } else if (max_probability == 1) {
            range[1] = sdsnew("(");
            range[1] = sdscatfmt(range[1],"%S",max_str);
            sdsfree(max_str);
        } else {
            range[1] = max_str; /* ownership moves into the result */
        }
    } else if (range_type == ZSET_RANGE_MIN_MAX_TYPE_LEX) {
        sds min_str = get_random_string();
        sds max_str = get_random_string();
        sds swap;
        unsigned int min_probability = rand()%3;
        unsigned int max_probability = rand()%3;

        if ((probability >= 95 && sdscmp(min_str,max_str) < 0) ||
            (probability < 95 && sdscmp(min_str,max_str) > 0)) {
            swap = min_str;
            min_str = max_str;
            max_str = swap;
        }

        if (min_probability == 0) {
            range[0] = sdsnew("-");
        } else if (min_probability == 1) {
            range[0] = sdsnew("(");
            range[0] = sdscatfmt(range[0],"%S",min_str);
        } else {
            range[0] = sdsnew("[");
            range[0] = sdscatfmt(range[0],"%S",min_str);
        }
        /* The bound text was copied (or not needed at all) in every case. */
        sdsfree(min_str);

        if (max_probability == 0) {
            range[1] = sdsnew("+");
        } else if (max_probability == 1) {
            range[1] = sdsnew("(");
            range[1] = sdscatfmt(range[1],"%S",max_str);
        } else {
            range[1] = sdsnew("[");
            range[1] = sdscatfmt(range[1],"%S",max_str);
        }
        sdsfree(max_str);
    } else {
        free(range);
        range = NULL;
    }

    return range;
}

/* Return a random field count in 1..field_length_max. */
static unsigned int get_random_field_len(void)
{
    unsigned int below_max = get_random_unsigned_int()%field_length_max;

    return below_max + 1;
}

/* Return a key for producer dp according to the scheme's hit ratio table.
 * The current slot of ps->hit_ratio_array decides the source: a zero
 * entry yields a freshly generated key, any other entry a key from the
 * cache (falling back to a fresh key when the cache gives NULL). The slot
 * index then advances and wraps around at hit_ratio_array_len. */
static sds get_random_key_with_hit_ratio(produce_scheme *ps, data_producer *dp)
{
    sds picked = NULL;
    int want_cached = (ps->hit_ratio_array[ps->hit_ratio_idx++] != 0);

    if (want_cached) {
        picked = get_random_cached_key(ps,dp);
    }
    if (picked == NULL) {
        picked = get_random_key();
    }

    if (ps->hit_ratio_idx >= ps->hit_ratio_array_len) {
        ps->hit_ratio_idx = 0;
    }
    return picked;
}

/************** "Need cache key" (nck) predicate implementations ************/
/* Return 1 when reply exists and is not an error reply, else 0. */
static int nck_when_noerror(redisReply *reply)
{
    return (reply != NULL && reply->type != REDIS_REPLY_ERROR) ? 1 : 0;
}

/* Return 1 when reply is a status reply whose text is exactly "OK",
 * else 0 (including a NULL reply). */
static int nck_when_ok(redisReply *reply)
{
    if (reply == NULL || reply->type != REDIS_REPLY_STATUS) {
        return 0;
    }

    return strcmp(reply->str, "OK") == 0 ? 1 : 0;
}

/* Return 1 when reply exists and is a string reply, else 0. */
static int nck_when_str(redisReply *reply)
{
    return (reply != NULL && reply->type == REDIS_REPLY_STRING) ? 1 : 0;
}

/* Return 1 when reply is an integer reply with a value >= 0, else 0
 * (including a NULL reply). */
static int nck_when_unsigned_integer(redisReply *reply)
{
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER) {
        return 0;
    }

    return reply->integer >= 0 ? 1 : 0;
}

/* Return 1 when reply is an integer reply with a value > 0, else 0
 * (including a NULL reply). */
static int nck_when_nonzero_unsigned_integer(redisReply *reply)
{
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER) {
        return 0;
    }

    return reply->integer > 0 ? 1 : 0;
}

/* Return 1 when reply is an integer reply equal to 0 or 1, else 0
 * (including a NULL reply). */
static int nck_when_zero_or_one(redisReply *reply)
{
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER) {
        return 0;
    }

    switch (reply->integer) {
    case 0:
    case 1:
        return 1;
    default:
        return 0;
    }
}

/* Return 1 when reply is an integer reply equal to 1, else 0
 * (including a NULL reply). */
static int nck_when_one(redisReply *reply)
{
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER) {
        return 0;
    }

    return reply->integer == 1 ? 1 : 0;
}

/************** End of "need cache key" (nck) predicate implementations ************/

/* Build a 2-argument request: dp->name followed by a key chosen
 * according to the scheme's hit ratio. */
static data_unit *get_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Build a 3-argument request: dp->name, a freshly generated random key
 * and a random string value. ps is not used. */
static data_unit *set_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key();
    unit->argv[2] = get_random_string();

    return unit;
}

/* Build a 3-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio and a random string value. */
static data_unit *setnx_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = get_random_string();

    return unit;
}

/* Need cache key? Yes (1) only when reply is an integer reply equal
 * to 1; otherwise 0, including for a NULL reply. */
static int setnx_cmd_nck(redisReply *reply)
{
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER) {
        return 0;
    }

    return reply->integer == 1 ? 1 : 0;
}

/* Build a 4-argument request: dp->name, a freshly generated random key,
 * a random number in 0..9999 and a random string value. ps is not used. */
static data_unit *setex_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 4;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key();
    unit->argv[2] = sdsfromlonglong(rand()%10000);
    unit->argv[3] = get_random_string();

    return unit;
}

/* Build a 4-argument request: dp->name, a freshly generated random key,
 * a random number in 0..9999 and a random string value. ps is not used. */
static data_unit *psetex_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 4;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key();
    unit->argv[2] = sdsfromlonglong(rand()%10000);
    unit->argv[3] = get_random_string();

    return unit;
}

/* Build a 2-argument request: dp->name followed by a freshly generated
 * random key. ps is not used. */
static data_unit *del_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key();

    return unit;
}

/* Build a 3-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio and a random number in 0..9999. */
static data_unit *expire_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = sdsfromlonglong(rand()%10000);

    return unit;
}

/* Build a 3-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio and a timestamp equal to the current time in
 * seconds (vrt_msec_now()/1000) plus a random offset in 0..9999. */
static data_unit *expireat_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = sdsfromlonglong(vrt_msec_now()/1000LL+rand()%10000);

    return unit;
}

/* Build a 2-argument request: dp->name followed by a key chosen
 * according to the scheme's hit ratio. */
static data_unit *exists_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Build a 2-argument request: dp->name followed by a key chosen
 * according to the scheme's hit ratio. */
static data_unit *ttl_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Build a 2-argument request: dp->name followed by a key chosen
 * according to the scheme's hit ratio. */
static data_unit *pttl_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Build a 2-argument request: dp->name followed by a freshly generated
 * random key. ps is not used. */
static data_unit *incr_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key();

    return unit;
}

/* Build a 2-argument request: dp->name followed by a freshly generated
 * random key. ps is not used. */
static data_unit *decr_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key();

    return unit;
}

/* Build a 3-argument request: dp->name, a freshly generated random key
 * and a random number in 0..9999. ps is not used. */
static data_unit *incrby_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key();
    unit->argv[2] = sdsfromlonglong(rand()%10000);

    return unit;
}

/* Build a 3-argument request: dp->name, a freshly generated random key
 * and a random number in 0..9999. ps is not used. */
static data_unit *decrby_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key();
    unit->argv[2] = sdsfromlonglong(rand()%10000);

    return unit;
}

/* Build a 3-argument request: dp->name, a freshly generated random key
 * and a random string value. ps is not used. */
static data_unit *append_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key();
    unit->argv[2] = get_random_string();

    return unit;
}

/* Need cache key? Yes (1) whenever reply is an integer reply, whatever
 * its value; otherwise 0, including for a NULL reply. */
static int append_cmd_nck(redisReply *reply)
{
    return (reply != NULL && reply->type == REDIS_REPLY_INTEGER) ? 1 : 0;
}

/* Build a 2-argument request: dp->name followed by a key chosen
 * according to the scheme's hit ratio. */
static data_unit *strlen_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Build a 3-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio and a random string value. */
static data_unit *getset_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = get_random_string();

    return unit;
}

/* Build a 3-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio and a random decimal number in text form. */
static data_unit *incrbyfloat_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = get_random_float_str();

    return unit;
}

/* Build a 4-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio, a random offset in 0..29999 and a random bit
 * value ("1" or "0"). */
static data_unit *setbit_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 4;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = sdsfromlonglong(get_random_unsigned_int()%30000);
    unit->argv[3] = sdsnew((rand()%2) ? "1" : "0");

    return unit;
}

/* Build a 3-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio and a random offset in 0..29999. */
static data_unit *getbit_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = sdsfromlonglong(get_random_unsigned_int()%30000);

    return unit;
}

/* Build a 4-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio, a random offset in 0..29999 and a random string. */
static data_unit *setrange_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 4;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = sdsfromlonglong(get_random_unsigned_int()%30000);
    unit->argv[3] = get_random_string();

    return unit;
}

/* Build a 4-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio and two random signed offsets, each in
 * -29999..29999. */
static data_unit *getrange_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 4;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = sdsfromlonglong(get_random_int()%30000);
    unit->argv[3] = sdsfromlonglong(get_random_int()%30000);

    return unit;
}

/* Build a request of dp->name plus a key chosen according to the
 * scheme's hit ratio. A coin flip decides whether two random signed
 * offsets (each in -29999..29999) are appended, giving 4 arguments
 * instead of 2. */
static data_unit *bitcount_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    int ranged = (rand()%2) ? 1 : 0;
    data_unit *unit = data_unit_get();

    unit->dp = dp;
    if (ranged) {
        unit->argc = 4;
    } else {
        unit->argc = 2;
    }
    unit->argv = malloc(unit->argc*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    if (!ranged) {
        return unit;
    }

    unit->argv[2] = sdsfromlonglong(get_random_int()%30000);
    unit->argv[3] = sdsfromlonglong(get_random_int()%30000);
    return unit;
}

/* Build a request of dp->name, a key chosen according to the scheme's
 * hit ratio and a random bit ("0" or "1"), optionally followed by range
 * bounds. A random draw picks one of three shapes with equal chance:
 * no bound (3 arguments), a start only (4) or a start and an end (5).
 * Each bound is a random signed offset in -29999..29999. */
static data_unit *bitpos_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    /* 0: no range; 1: just have start; 2: have start and end. */
    int bounds = (int)(rand()%3);
    data_unit *unit = data_unit_get();

    unit->dp = dp;
    unit->argc = 3 + bounds;
    unit->argv = malloc(unit->argc*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = sdsnew((rand()%2) ? "0" : "1");
    if (bounds >= 1) {
        unit->argv[3] = sdsfromlonglong(get_random_int()%30000);
    }
    if (bounds == 2) {
        unit->argv[4] = sdsfromlonglong(get_random_int()%30000);
    }

    return unit;
}

/* Build a 2-argument request: dp->name followed by a single key chosen
 * according to the scheme's hit ratio. */
static data_unit *mget_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Build a 3-argument request: dp->name, one freshly generated random
 * key and one random string value. ps is not used. */
static data_unit *mset_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key();
    unit->argv[2] = get_random_string();

    return unit;
}

/* Build a 4-argument request: dp->name, a freshly generated random key
 * and two random strings (field and value positions). ps is not used. */
static data_unit *hset_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 4;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key();
    unit->argv[2] = get_random_string();
    unit->argv[3] = get_random_string();

    return unit;
}

/* Build a 3-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio and a random string. */
static data_unit *hget_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = get_random_string();

    return unit;
}

/* Build a 2-argument request: dp->name followed by a key chosen
 * according to the scheme's hit ratio. */
static data_unit *hlen_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Build a request of dp->name, a key chosen according to the scheme's
 * hit ratio and a random number (get_random_field_len()) of random
 * strings. */
static data_unit *hdel_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    unsigned int slot, extra = get_random_field_len();
    data_unit *unit = data_unit_get();

    unit->dp = dp;
    unit->argc = 2 + extra;
    unit->argv = malloc(unit->argc*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    for (slot = 2; slot < 2 + extra; slot ++) {
        unit->argv[slot] = get_random_string();
    }

    return unit;
}

/* Build a 3-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio and a random string. */
static data_unit *hexists_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = get_random_string();

    return unit;
}

/* Build a 2-argument request: dp->name followed by a key chosen
 * according to the scheme's hit ratio. */
static data_unit *hkeys_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Build a 2-argument request: dp->name followed by a key chosen
 * according to the scheme's hit ratio. */
static data_unit *hvals_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Build a 2-argument request: dp->name followed by a key chosen
 * according to the scheme's hit ratio. */
static data_unit *hgetall_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Build a 4-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio, a random string and a random signed integer. */
static data_unit *hincrby_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 4;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = get_random_string();
    unit->argv[3] = sdsfromlonglong(get_random_int());

    return unit;
}

/* Build a 4-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio, a random string and a random decimal number in
 * text form. */
static data_unit *hincrbyfloat_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 4;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = get_random_string();
    unit->argv[3] = get_random_float_str();

    return unit;
}

/* Build a request of dp->name, a key chosen according to the scheme's
 * hit ratio and a random number (get_random_field_len()) of random
 * strings. */
static data_unit *hmget_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    unsigned int slot, extra = get_random_field_len();
    data_unit *unit = data_unit_get();

    unit->dp = dp;
    unit->argc = 2+extra;
    unit->argv = malloc(unit->argc*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    for (slot = 2; slot < 2 + extra; slot ++) {
        unit->argv[slot] = get_random_string();
    }

    return unit;
}

/* Build a request of dp->name, a freshly generated random key and a
 * random number (get_random_field_len()) of pairs of random strings.
 * ps is not used. */
static data_unit *hmset_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    unsigned int pair, pairs = get_random_field_len();
    data_unit *unit = data_unit_get();

    unit->dp = dp;
    unit->argc = 2+pairs*2;
    unit->argv = malloc(unit->argc*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key();
    for (pair = 0; pair < pairs; pair ++) {
        unit->argv[2+pair*2] = get_random_string();
        unit->argv[3+pair*2] = get_random_string();
    }

    return unit;
}

/* Build a 4-argument request: dp->name, a freshly generated random key
 * and two random strings. ps is not used. */
static data_unit *hsetnx_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 4;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key();
    unit->argv[2] = get_random_string();
    unit->argv[3] = get_random_string();

    return unit;
}

/* Build a 3-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio and a random string. */
static data_unit *hstrlen_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = get_random_string();

    return unit;
}

/* Build a request of dp->name, a key chosen according to the scheme's
 * hit ratio and a random number (get_random_field_len()) of random
 * strings. */
static data_unit *rpush_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    unsigned int slot, extra = get_random_field_len();
    data_unit *unit = data_unit_get();

    unit->dp = dp;
    unit->argc = 2+extra;
    unit->argv = malloc(unit->argc*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    for (slot = 2; slot < 2 + extra; slot ++) {
        unit->argv[slot] = get_random_string();
    }

    return unit;
}

/* Need cache key? Yes (1) whenever reply is an integer reply, whatever
 * its value; otherwise 0, including for a NULL reply. */
static int rpush_cmd_nck(redisReply *reply)
{
    return (reply != NULL && reply->type == REDIS_REPLY_INTEGER) ? 1 : 0;
}

/* Build a request of dp->name, a key chosen according to the scheme's
 * hit ratio and a random number (get_random_field_len()) of random
 * strings. */
static data_unit *lpush_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    unsigned int slot, extra = get_random_field_len();
    data_unit *unit = data_unit_get();

    unit->dp = dp;
    unit->argc = 2+extra;
    unit->argv = malloc(unit->argc*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    for (slot = 2; slot < 2 + extra; slot ++) {
        unit->argv[slot] = get_random_string();
    }

    return unit;
}

/* Build a 4-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio and two random signed indexes, each with a
 * magnitude of at most field_length_max. */
static data_unit *lrange_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 4;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = sdsfromlonglong((long long)get_random_int()%(field_length_max+1));
    unit->argv[3] = sdsfromlonglong((long long)get_random_int()%(field_length_max+1));

    return unit;
}

/* Build a 2-argument request: dp->name followed by a key chosen
 * according to the scheme's hit ratio. */
static data_unit *rpop_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Build a 2-argument request: dp->name followed by a key chosen
 * according to the scheme's hit ratio. */
static data_unit *lpop_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Build a 2-argument request: dp->name followed by a key chosen
 * according to the scheme's hit ratio. */
static data_unit *llen_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 2;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Build a 4-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio, a random signed count with a magnitude of at most
 * field_length_max, and a random string. */
static data_unit *lrem_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 4;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = sdsfromlonglong((long long)get_random_int()%(field_length_max+1));
    unit->argv[3] = get_random_string();

    return unit;
}

/* Build a 4-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio and two random signed indexes, each with a
 * magnitude of at most field_length_max. */
static data_unit *ltrim_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 4;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = sdsfromlonglong((long long)get_random_int()%(field_length_max+1));
    unit->argv[3] = sdsfromlonglong((long long)get_random_int()%(field_length_max+1));

    return unit;
}

/* Build a 3-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio and a random signed index with a magnitude of at
 * most field_length_max. */
static data_unit *lindex_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 3;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = sdsfromlonglong((long long)get_random_int()%(field_length_max+1));

    return unit;
}

/* Build a 4-argument request: dp->name, a key chosen according to the
 * scheme's hit ratio, a random signed index with a magnitude of at most
 * field_length_max, and a random string. */
static data_unit *lset_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    const int nargs = 4;

    unit->dp = dp;
    unit->argc = nargs;
    unit->argv = malloc(nargs*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[2] = sdsfromlonglong((long long)get_random_int()%(field_length_max+1));
    unit->argv[3] = get_random_string();

    return unit;
}

/* Producer for the "sadd" table entry. Builds a command with
 * 2 + get_random_field_len() arguments:
 *   argv[0]   = dp->name
 *   argv[1]   = key chosen by get_random_key_with_hit_ratio(ps,dp)
 *   argv[2..] = one random string per generated member
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *sadd_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    unsigned int member_count = get_random_field_len();
    unsigned int left;
    data_unit *unit;
    sds *slot;

    unit = data_unit_get();
    unit->dp = dp;
    unit->argc = 2 + member_count;
    unit->argv = malloc(unit->argc*sizeof(sds));

    slot = unit->argv;
    *slot++ = sdsnew(dp->name);
    *slot++ = get_random_key_with_hit_ratio(ps,dp);
    /* Fill the remaining slots in ascending order. */
    for (left = member_count; left > 0; left --) {
        *slot++ = get_random_string();
    }

    return unit;
}

/* Producer for the "smembers" table entry. Builds a 2-argument command:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *smembers_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    sds *args;

    unit->dp = dp;
    unit->argc = 2;
    args = malloc(unit->argc*sizeof(sds));
    unit->argv = args;

    args[0] = sdsnew(dp->name);
    args[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Producer for the "scard" table entry. Builds a 2-argument command:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *scard_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    sds *args;

    unit->dp = dp;
    unit->argc = 2;
    args = malloc(unit->argc*sizeof(sds));
    unit->argv = args;

    args[0] = sdsnew(dp->name);
    args[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Producer for the "srem" table entry. Builds a command with
 * 2 + get_random_field_len() arguments:
 *   argv[0]   = dp->name
 *   argv[1]   = key chosen by get_random_key_with_hit_ratio(ps,dp)
 *   argv[2..] = one random string per generated member
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *srem_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    unsigned int member_count = get_random_field_len();
    unsigned int left;
    data_unit *unit;
    sds *slot;

    unit = data_unit_get();
    unit->dp = dp;
    unit->argc = 2+member_count;
    unit->argv = malloc(unit->argc*sizeof(sds));

    slot = unit->argv;
    *slot++ = sdsnew(dp->name);
    *slot++ = get_random_key_with_hit_ratio(ps,dp);
    /* Fill the remaining slots in ascending order. */
    for (left = member_count; left > 0; left --) {
        *slot++ = get_random_string();
    }

    return unit;
}

/* Producer for the "sismember" table entry. Builds a 3-argument command:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 *   argv[2] = random string
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *sismember_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    sds *args;

    unit->dp = dp;
    unit->argc = 3;
    args = malloc(unit->argc*sizeof(sds));
    unit->argv = args;

    args[0] = sdsnew(dp->name);
    args[1] = get_random_key_with_hit_ratio(ps,dp);
    args[2] = get_random_string();

    return unit;
}

/* Producer for the "sunion" table entry. Only a single key is generated:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *sunion_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    sds *args;

    unit->dp = dp;
    unit->argc = 2;
    args = malloc(unit->argc*sizeof(sds));
    unit->argv = args;

    args[0] = sdsnew(dp->name);
    args[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Producer for the "sdiff" table entry. Only a single key is generated:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *sdiff_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    sds *args;

    unit->dp = dp;
    unit->argc = 2;
    args = malloc(unit->argc*sizeof(sds));
    unit->argv = args;

    args[0] = sdsnew(dp->name);
    args[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Producer for the "sinter" table entry. Only a single key is generated:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *sinter_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    sds *args;

    unit->dp = dp;
    unit->argc = 2;
    args = malloc(unit->argc*sizeof(sds));
    unit->argv = args;

    args[0] = sdsnew(dp->name);
    args[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Need cache key?
 * Returns 1 when `reply` is non-NULL and is an integer reply,
 * otherwise 0. */
static int lpush_cmd_nck(redisReply *reply)
{
    return (reply != NULL && reply->type == REDIS_REPLY_INTEGER) ? 1 : 0;
}

/* Producer for the "zadd" table entry. Builds a command with
 * 2 + 2*get_random_field_len() arguments:
 *   argv[0] = dp->name
 *   argv[1] = key from get_random_key() (the hit-ratio helper is not
 *             used here, so `ps` is unused)
 *   then pairs of (get_random_float_str(), get_random_string())
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *zadd_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    unsigned int pair_count = get_random_field_len();
    unsigned int end = 2+pair_count*2;
    unsigned int pos;
    data_unit *unit;

    unit = data_unit_get();
    unit->dp = dp;
    unit->argc = 2+pair_count*2;
    unit->argv = malloc(unit->argc*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key();

    /* Each iteration writes one pair: float string first, then string. */
    pos = 2;
    while (pos < end) {
        unit->argv[pos] = get_random_float_str();
        unit->argv[pos+1] = get_random_string();
        pos += 2;
    }

    return unit;
}

/* Need cache key?
 * Returns 1 when `reply` is non-NULL and is an integer reply,
 * otherwise 0. */
static int zadd_cmd_nck(redisReply *reply)
{
    return (reply != NULL && reply->type == REDIS_REPLY_INTEGER) ? 1 : 0;
}

/* Producer for the "zincrby" table entry. Builds a 4-argument command:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 *   argv[2] = get_random_float_str()
 *   argv[3] = get_random_string()
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *zincrby_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *du;

    du = data_unit_get();
    du->dp = dp;
    du->argc = 4;
    du->argv = malloc(du->argc*sizeof(sds));
    du->argv[0] = sdsnew(dp->name);
    du->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    du->argv[2] = get_random_float_str();
    du->argv[3] = get_random_string();

    return du;
}

/* Need cache key?
 * Returns 1 when `reply` indicates that the command succeeded, otherwise 0.
 *
 * ZINCRBY answers with the new score encoded as a (bulk) string, not as
 * an integer, so a string reply is what signals success here. An integer
 * reply is still accepted so that the previous behavior is a subset of
 * the new one. */
static int zincrby_cmd_nck(redisReply *reply)
{
    if (reply == NULL) return 0;

    if (reply->type == REDIS_REPLY_STRING ||
        reply->type == REDIS_REPLY_INTEGER) {
        return 1;
    }

    return 0;
}

/* Producer for the "zrange" table entry. Builds a 4- or 5-argument
 * command:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 *   argv[2] = "0"
 *   argv[3] = get_random_int()%10000
 *   argv[4] = "withscores" (only when rand()%2 == 1)
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *zrange_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *du;
    int withscores;

    /* Decide first: argc depends on whether the option is appended. */
    withscores = (rand()%2 == 1) ? 1 : 0;

    du = data_unit_get();
    du->dp = dp;
    du->argc = withscores?5:4;
    du->argv = malloc(du->argc*sizeof(sds));
    du->argv[0] = sdsnew(dp->name);
    du->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    du->argv[2] = sdsfromlonglong(0);
    du->argv[3] = sdsfromlonglong(get_random_int()%10000);
    if (withscores) du->argv[4] = sdsnew("withscores");

    return du;
}

/* Producer for the "zrevrange" table entry. Builds a 4- or 5-argument
 * command:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 *   argv[2] = "0"
 *   argv[3] = get_random_int()%10000
 *   argv[4] = "withscores" (only when rand()%2 == 1)
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *zrevrange_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *du;
    int withscores;

    /* Decide first: argc depends on whether the option is appended. */
    withscores = (rand()%2 == 1) ? 1 : 0;

    du = data_unit_get();
    du->dp = dp;
    du->argc = withscores?5:4;
    du->argv = malloc(du->argc*sizeof(sds));
    du->argv[0] = sdsnew(dp->name);
    du->argv[1] = get_random_key_with_hit_ratio(ps,dp);
    du->argv[2] = sdsfromlonglong(0);
    du->argv[3] = sdsfromlonglong(get_random_int()%10000);
    if (withscores) du->argv[4] = sdsnew("withscores");

    return du;
}

/* Producer for the "zrem" table entry. Builds a command with
 * 2 + get_random_field_len() arguments:
 *   argv[0]   = dp->name
 *   argv[1]   = key chosen by get_random_key_with_hit_ratio(ps,dp)
 *   argv[2..] = one random string per generated member
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *zrem_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    unsigned int member_count = get_random_field_len();
    unsigned int end = 2+member_count;
    unsigned int pos = 2;
    data_unit *unit;

    unit = data_unit_get();
    unit->dp = dp;
    unit->argc = 2+member_count;
    unit->argv = malloc(unit->argc*sizeof(sds));
    unit->argv[0] = sdsnew(dp->name);
    unit->argv[1] = get_random_key_with_hit_ratio(ps,dp);

    while (pos < end) {
        unit->argv[pos] = get_random_string();
        pos ++;
    }

    return unit;
}

/* Producer for the "zcard" table entry. Builds a 2-argument command:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *zcard_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    sds *args;

    unit->dp = dp;
    unit->argc = 2;
    args = malloc(unit->argc*sizeof(sds));
    unit->argv = args;

    args[0] = sdsnew(dp->name);
    args[1] = get_random_key_with_hit_ratio(ps,dp);

    return unit;
}

/* Producer for the "zcount" table entry. Builds a 4-argument command:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 *   argv[2], argv[3] = the two strings returned by
 *       get_random_zset_range_min_max_str(ZSET_RANGE_MIN_MAX_TYPE_SCORE)
 * The two range strings are moved into argv; only the array that held
 * them is freed here. */
static data_unit *zcount_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    sds *bounds = get_random_zset_range_min_max_str(ZSET_RANGE_MIN_MAX_TYPE_SCORE);
    data_unit *unit = data_unit_get();
    sds *args;

    unit->dp = dp;
    unit->argc = 4;
    args = malloc(unit->argc*sizeof(sds));
    unit->argv = args;

    args[0] = sdsnew(dp->name);
    args[1] = get_random_key_with_hit_ratio(ps,dp);
    args[2] = bounds[0];
    args[3] = bounds[1];

    free(bounds);
    return unit;
}

/* Producer for the "zrangebyscore" table entry. Builds:
 *   dp->name, key, min, max [, "withscores"] [, "limit", n1, n2]
 * where min/max come from
 * get_random_zset_range_min_max_str(ZSET_RANGE_MIN_MAX_TYPE_SCORE), each
 * optional part is included when its own rand()%2 draw equals 1, and
 * n1/n2 are get_random_unsigned_int() values.
 * The two range strings are moved into argv; only the array that held
 * them is freed here. */
static data_unit *zrangebyscore_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    sds *bounds = get_random_zset_range_min_max_str(ZSET_RANGE_MIN_MAX_TYPE_SCORE);
    /* The two draws happen in this order: withscores, then limit. */
    int withscores = (rand()%2 == 1) ? 1 : 0;
    int limit = (rand()%2 == 1) ? 1 : 0;
    unsigned int arg_count = 4, used = 0;
    data_unit *unit;

    if (withscores) arg_count += 1;
    if (limit) arg_count += 3;

    unit = data_unit_get();
    unit->dp = dp;
    unit->argc = arg_count;
    unit->argv = malloc(unit->argc*sizeof(sds));

    unit->argv[used++] = sdsnew(dp->name);
    unit->argv[used++] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[used++] = bounds[0];
    unit->argv[used++] = bounds[1];
    if (withscores) {
        unit->argv[used++] = sdsnew("withscores");
    }
    if (limit) {
        unit->argv[used++] = sdsnew("limit");
        unit->argv[used++] = sdsfromlonglong(get_random_unsigned_int());
        unit->argv[used++] = sdsfromlonglong(get_random_unsigned_int());
    }

    /* Every allocated slot must have been filled. */
    ASSERT(arg_count == used);

    free(bounds);
    return unit;
}

/* Producer for the "zrevrangebyscore" table entry. Builds:
 *   dp->name, key, range[0], range[1] [, "withscores"] [, "limit", n1, n2]
 * where range comes from
 * get_random_zset_range_min_max_str(ZSET_RANGE_MIN_MAX_TYPE_SCORE), each
 * optional part is included when its own rand()%2 draw equals 1, and
 * n1/n2 are get_random_unsigned_int() values.
 * The two range strings are moved into argv; only the array that held
 * them is freed here. */
static data_unit *zrevrangebyscore_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    sds *bounds = get_random_zset_range_min_max_str(ZSET_RANGE_MIN_MAX_TYPE_SCORE);
    /* The two draws happen in this order: withscores, then limit. */
    int withscores = (rand()%2 == 1) ? 1 : 0;
    int limit = (rand()%2 == 1) ? 1 : 0;
    unsigned int arg_count = 4, used = 0;
    data_unit *unit;

    if (withscores) arg_count += 1;
    if (limit) arg_count += 3;

    unit = data_unit_get();
    unit->dp = dp;
    unit->argc = arg_count;
    unit->argv = malloc(unit->argc*sizeof(sds));

    unit->argv[used++] = sdsnew(dp->name);
    unit->argv[used++] = get_random_key_with_hit_ratio(ps,dp);
    unit->argv[used++] = bounds[0];
    unit->argv[used++] = bounds[1];
    if (withscores) {
        unit->argv[used++] = sdsnew("withscores");
    }
    if (limit) {
        unit->argv[used++] = sdsnew("limit");
        unit->argv[used++] = sdsfromlonglong(get_random_unsigned_int());
        unit->argv[used++] = sdsfromlonglong(get_random_unsigned_int());
    }

    /* Every allocated slot must have been filled. */
    ASSERT(arg_count == used);

    free(bounds);
    return unit;
}

/* Producer for the "zrank" table entry. Builds a 3-argument command:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 *   argv[2] = random string
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *zrank_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    sds *args;

    unit->dp = dp;
    unit->argc = 3;
    args = malloc(unit->argc*sizeof(sds));
    unit->argv = args;

    args[0] = sdsnew(dp->name);
    args[1] = get_random_key_with_hit_ratio(ps,dp);
    args[2] = get_random_string();

    return unit;
}

/* Producer for the "zrevrank" table entry. Builds a 3-argument command:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 *   argv[2] = random string
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *zrevrank_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    sds *args;

    unit->dp = dp;
    unit->argc = 3;
    args = malloc(unit->argc*sizeof(sds));
    unit->argv = args;

    args[0] = sdsnew(dp->name);
    args[1] = get_random_key_with_hit_ratio(ps,dp);
    args[2] = get_random_string();

    return unit;
}

/* Producer for the "zscore" table entry. Builds a 3-argument command:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 *   argv[2] = random string
 * Returns a unit obtained from data_unit_get(); its argv array is
 * malloc'ed here (the malloc result is not checked). */
static data_unit *zscore_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    data_unit *unit = data_unit_get();
    sds *args;

    unit->dp = dp;
    unit->argc = 3;
    args = malloc(unit->argc*sizeof(sds));
    unit->argv = args;

    args[0] = sdsnew(dp->name);
    args[1] = get_random_key_with_hit_ratio(ps,dp);
    args[2] = get_random_string();

    return unit;
}

/* Producer for the "zremrangebyscore" table entry. Builds a 4-argument
 * command:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 *   argv[2], argv[3] = the two strings returned by
 *       get_random_zset_range_min_max_str(ZSET_RANGE_MIN_MAX_TYPE_SCORE)
 * The two range strings are moved into argv; only the array that held
 * them is freed here. */
static data_unit *zremrangebyscore_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    sds *bounds = get_random_zset_range_min_max_str(ZSET_RANGE_MIN_MAX_TYPE_SCORE);
    data_unit *unit = data_unit_get();
    sds *args;

    unit->dp = dp;
    unit->argc = 4;
    args = malloc(unit->argc*sizeof(sds));
    unit->argv = args;

    args[0] = sdsnew(dp->name);
    args[1] = get_random_key_with_hit_ratio(ps,dp);
    args[2] = bounds[0];
    args[3] = bounds[1];

    free(bounds);
    return unit;
}

/* Producer for the "zremrangebyrank" table entry. Builds a 4-argument
 * command:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 *   argv[2], argv[3] = the two strings returned by
 *       get_random_zset_range_min_max_str(ZSET_RANGE_MIN_MAX_TYPE_RANK)
 * The two range strings are moved into argv; only the array that held
 * them is freed here. */
static data_unit *zremrangebyrank_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    sds *bounds = get_random_zset_range_min_max_str(ZSET_RANGE_MIN_MAX_TYPE_RANK);
    data_unit *unit = data_unit_get();
    sds *args;

    unit->dp = dp;
    unit->argc = 4;
    args = malloc(unit->argc*sizeof(sds));
    unit->argv = args;

    args[0] = sdsnew(dp->name);
    args[1] = get_random_key_with_hit_ratio(ps,dp);
    args[2] = bounds[0];
    args[3] = bounds[1];

    free(bounds);
    return unit;
}

/* Producer that builds a 4-argument lexicographic range-removal command:
 *   argv[0] = dp->name
 *   argv[1] = key chosen by get_random_key_with_hit_ratio(ps,dp)
 *   argv[2], argv[3] = the two strings returned by
 *       get_random_zset_range_min_max_str(ZSET_RANGE_MIN_MAX_TYPE_LEX)
 * The two range strings are moved into argv; only the array that held
 * them is freed here. */
static data_unit *zremrangebylex_cmd_producer(data_producer *dp, produce_scheme *ps)
{
    sds *bounds = get_random_zset_range_min_max_str(ZSET_RANGE_MIN_MAX_TYPE_LEX);
    data_unit *unit = data_unit_get();
    sds *args;

    unit->dp = dp;
    unit->argc = 4;
    args = malloc(unit->argc*sizeof(sds));
    unit->argv = args;

    args[0] = sdsnew(dp->name);
    args[1] = get_random_key_with_hit_ratio(ps,dp);
    args[2] = bounds[0];
    args[3] = bounds[1];

    free(bounds);
    return unit;
}

/* Number of entries in redis_data_producer_table; computed in
 * vrt_produce_data_init(). */
static int producers_count;
/* Table of every command the test tool can produce.
 *
 * NOTE(review): the initializers are positional; judging by how the
 * members are used in this file the order is presumably
 *   name, proc, arity, sflags, flags, getkeys_proc,
 *   firstkey, lastkey, keystep, cmd_type, need-cache-key callback
 * -- confirm against the data_producer definition.
 *
 * - The sflags string is translated into the flags bitmask by
 *   vrt_produce_data_init().
 * - firstkey/lastkey/keystep are consumed by
 *   get_keys_using_data_producer_table(); a negative lastkey is taken
 *   relative to argc.
 * - The "zremrangebylex" producer defined above has no entry here. */
data_producer redis_data_producer_table[] = {
    /* Key */
    {"del",del_cmd_producer,-2,"w",0,NULL,1,-1,1,TEST_CMD_TYPE_KEY,NULL},
    {"exists",exists_cmd_producer,-2,"rF",0,NULL,1,-1,1,TEST_CMD_TYPE_KEY,NULL},
    {"ttl",ttl_cmd_producer,2,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_EXPIRE,NULL},
    {"pttl",pttl_cmd_producer,2,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_EXPIRE,NULL},
    {"expire",expire_cmd_producer,3,"wF",0,NULL,1,1,1,TEST_CMD_TYPE_EXPIRE,NULL},
    {"expireat",expireat_cmd_producer,3,"wF",0,NULL,1,1,1,TEST_CMD_TYPE_EXPIRE,NULL},
    /* String */
    {"get",get_cmd_producer,2,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,NULL},
    {"set",set_cmd_producer,-3,"wmA",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,nck_when_ok},
    {"setnx",setnx_cmd_producer,3,"wmFA",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,setnx_cmd_nck},
    {"setex",setex_cmd_producer,4,"wmA",0,NULL,1,1,1,TEST_CMD_TYPE_EXPIRE,nck_when_ok},
    {"psetex",psetex_cmd_producer,4,"wmA",0,NULL,1,1,1,TEST_CMD_TYPE_EXPIRE,nck_when_ok},
    {"incr",incr_cmd_producer,2,"wmF",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,NULL},
    {"decr",decr_cmd_producer,2,"wmF",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,NULL},
    {"incrby",incrby_cmd_producer,3,"wmF",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,NULL},
    {"decrby",decrby_cmd_producer,3,"wmF",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,NULL},
    {"append",append_cmd_producer,3,"wmA",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,append_cmd_nck},
    {"strlen",strlen_cmd_producer,2,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,NULL},
    {"getset",getset_cmd_producer,3,"wmA",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,nck_when_noerror},
    {"incrbyfloat",incrbyfloat_cmd_producer,3,"wmFA",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,nck_when_str},
    {"setbit",setbit_cmd_producer,4,"wmA",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,nck_when_zero_or_one},
    {"getbit",getbit_cmd_producer,3,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,NULL},
    {"setrange",setrange_cmd_producer,4,"wmA",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,nck_when_nonzero_unsigned_integer},
    {"getrange",getrange_cmd_producer,4,"r",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,NULL},
    {"bitcount",bitcount_cmd_producer,-2,"r",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,NULL},
    {"bitpos",bitpos_cmd_producer,-3,"r",0,NULL,1,1,1,TEST_CMD_TYPE_STRING,NULL},
    {"mget",mget_cmd_producer,-2,"r",0,NULL,1,-1,1,TEST_CMD_TYPE_STRING,NULL},
    {"mset",mset_cmd_producer,-3,"wmA",0,NULL,1,-1,2,TEST_CMD_TYPE_STRING,nck_when_ok},
    /* Hash */
    {"hset",hset_cmd_producer,4,"wmFA",0,NULL,1,1,1,TEST_CMD_TYPE_HASH,nck_when_one},
    {"hget",hget_cmd_producer,3,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_HASH,NULL},
    {"hlen",hlen_cmd_producer,2,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_HASH,NULL},
    {"hdel",hdel_cmd_producer,-3,"wF",0,NULL,1,1,1,TEST_CMD_TYPE_HASH,NULL},
    {"hexists",hexists_cmd_producer,3,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_HASH,NULL},
    {"hkeys",hkeys_cmd_producer,2,"rS",0,NULL,1,1,1,TEST_CMD_TYPE_HASH,NULL},
    {"hvals",hvals_cmd_producer,2,"rS",0,NULL,1,1,1,TEST_CMD_TYPE_HASH,NULL},
    {"hgetall",hgetall_cmd_producer,2,"r",0,NULL,1,1,1,TEST_CMD_TYPE_HASH,NULL},
    {"hincrby",hincrby_cmd_producer,4,"wmF",0,NULL,1,1,1,TEST_CMD_TYPE_HASH,NULL},
    {"hincrbyfloat",hincrbyfloat_cmd_producer,4,"wmF",0,NULL,1,1,1,TEST_CMD_TYPE_HASH,NULL},
    {"hmget",hmget_cmd_producer,-3,"r",0,NULL,1,1,1,TEST_CMD_TYPE_HASH,NULL},
    {"hmset",hmset_cmd_producer,-4,"wmA",0,NULL,1,1,1,TEST_CMD_TYPE_HASH,nck_when_ok},
    {"hsetnx",hsetnx_cmd_producer,4,"wmFA",0,NULL,1,1,1,TEST_CMD_TYPE_HASH,nck_when_one},
    {"hstrlen",hstrlen_cmd_producer,3,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_HASH,NULL},
    /* List */
    {"rpush",rpush_cmd_producer,-3,"wmFA",0,NULL,1,1,1,TEST_CMD_TYPE_LIST,rpush_cmd_nck},
    {"lpush",lpush_cmd_producer,-3,"wmFA",0,NULL,1,1,1,TEST_CMD_TYPE_LIST,lpush_cmd_nck},
    {"lrange",lrange_cmd_producer,4,"r",0,NULL,1,1,1,TEST_CMD_TYPE_LIST,NULL},
    {"rpop",rpop_cmd_producer,2,"wF",0,NULL,1,1,1,TEST_CMD_TYPE_LIST,NULL},
    {"lpop",lpop_cmd_producer,2,"wF",0,NULL,1,1,1,TEST_CMD_TYPE_LIST,NULL},
    {"llen",llen_cmd_producer,2,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_LIST,NULL},
    {"lrem",lrem_cmd_producer,4,"w",0,NULL,1,1,1,TEST_CMD_TYPE_LIST,NULL},
    {"ltrim",ltrim_cmd_producer,4,"w",0,NULL,1,1,1,TEST_CMD_TYPE_LIST,NULL},
    {"lindex",lindex_cmd_producer,3,"r",0,NULL,1,1,1,TEST_CMD_TYPE_LIST,NULL},
    {"lset",lset_cmd_producer,4,"wm",0,NULL,1,1,1,TEST_CMD_TYPE_LIST,NULL},
    /* Set */
    {"sadd",sadd_cmd_producer,-3,"wmFA",0,NULL,1,1,1,TEST_CMD_TYPE_SET,nck_when_unsigned_integer},
    {"smembers",smembers_cmd_producer,2,"rS",0,NULL,1,1,1,TEST_CMD_TYPE_SET,NULL},
    {"scard",scard_cmd_producer,2,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_SET,NULL},
    {"srem",srem_cmd_producer,-3,"wF",0,NULL,1,1,1,TEST_CMD_TYPE_SET,NULL},
    {"sismember",sismember_cmd_producer,3,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_SET,NULL},
    {"sunion",sunion_cmd_producer,-2,"rS",0,NULL,1,-1,1,TEST_CMD_TYPE_SET,NULL},
    {"sdiff",sdiff_cmd_producer,-2,"rS",0,NULL,1,-1,1,TEST_CMD_TYPE_SET,NULL},
    {"sinter",sinter_cmd_producer,-2,"rS",0,NULL,1,-1,1,TEST_CMD_TYPE_SET,NULL},
    /* SortedSet */
    {"zadd",zadd_cmd_producer,-4,"wmFA",0,NULL,1,1,1,TEST_CMD_TYPE_ZSET,zadd_cmd_nck},
    {"zincrby",zincrby_cmd_producer,4,"wmFA",0,NULL,1,1,1,TEST_CMD_TYPE_ZSET,zincrby_cmd_nck},
    {"zrange",zrange_cmd_producer,-4,"r",0,NULL,1,1,1,TEST_CMD_TYPE_ZSET,NULL},
    {"zrevrange",zrevrange_cmd_producer,-4,"r",0,NULL,1,1,1,TEST_CMD_TYPE_ZSET,NULL},
    {"zrem",zrem_cmd_producer,-3,"wF",0,NULL,1,1,1,TEST_CMD_TYPE_ZSET,NULL},
    {"zcard",zcard_cmd_producer,2,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_ZSET,NULL},
    {"zcount",zcount_cmd_producer,4,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_ZSET,NULL},
    {"zrangebyscore",zrangebyscore_cmd_producer,-4,"r",0,NULL,1,1,1,TEST_CMD_TYPE_ZSET,NULL},
    {"zrevrangebyscore",zrevrangebyscore_cmd_producer,-4,"r",0,NULL,1,1,1,TEST_CMD_TYPE_ZSET,NULL},
    {"zrank",zrank_cmd_producer,3,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_ZSET,NULL},
    {"zrevrank",zrevrank_cmd_producer,3,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_ZSET,NULL},
    {"zscore",zscore_cmd_producer,3,"rF",0,NULL,1,1,1,TEST_CMD_TYPE_ZSET,NULL},
    {"zremrangebyscore",zremrangebyscore_cmd_producer,4,"w",0,NULL,1,1,1,TEST_CMD_TYPE_ZSET,NULL},
    {"zremrangebyrank",zremrangebyrank_cmd_producer,4,"w",0,NULL,1,1,1,TEST_CMD_TYPE_ZSET,NULL}
};

/* Allocate a data_unit with malloc() and reset every member
 * (dp, argc, argv, hashvalue, data) to NULL / 0.
 * The malloc result is not checked before it is written to.
 * Release the unit with data_unit_put(). */
data_unit *data_unit_get(void)
{
    data_unit *unit = malloc(sizeof(*unit));

    unit->data = NULL;
    unit->hashvalue = 0;
    unit->argv = NULL;
    unit->argc = 0;
    unit->dp = NULL;

    return unit;
}

/* Release a data_unit: sdsfree() every non-NULL argv element in the
 * range [0, argc), then free the argv array and the unit itself.
 * `du` must not be NULL. */
void data_unit_put(data_unit *du)
{
    int pos = 0;

    while (pos < du->argc) {
        if (du->argv[pos] != NULL) {
            sdsfree(du->argv[pos]);
        }
        pos ++;
    }

    free(du->argv);
    free(du);
}

static produce_scheme *produce_scheme_create(long long max_cached_keys, int hit_ratio)
{
    produce_scheme *ps;
    int count, idx;
    int ratio;
    
    ps = malloc(sizeof(*ps));
    if (ps == NULL) return NULL;
    ps->kcps = NULL;
    ps->hit_ratio_array = NULL;

    ps->kcps = darray_create(PRODUCE_KEY_CACHE_POOL_COUNT,sizeof(key_cache_array *));
    for (idx = 0; idx < PRODUCE_KEY_CACHE_POOL_COUNT; idx ++) {
        key_cache_array **kcp = darray_push(ps->kcps);
        *kcp = key_cache_array_create(max_cached_keys/PRODUCE_KEY_CACHE_POOL_COUNT);
        if (*kcp == NULL) {
            return NULL;
        }
    }

    /* Generate the hit ratio. */
    ps->hit_ratio_array_len = 100;
    ps->hit_ratio = hit_ratio;
    ps->hit_ratio_idx = 0;
    ps->hit_ratio_array = malloc(ps->hit_ratio_array_len*sizeof(int));
    ratio = ps->hit_ratio_array_len/ps->hit_ratio;
    if (ratio > 1) {
        count = ps->hit_ratio;
        for (idx = 0; idx < ps->hit_ratio_array_len; idx ++) {
            ps->hit_ratio_array[idx] = 0;
        }
    } else {
        count = ps->hit_ratio_array_len - ps->hit_ratio;
        for (idx = 0; idx < ps->hit_ratio_array_len; idx ++) {
            ps->hit_ratio_array[idx] = 1;
        }
    }
    while (count > 0) {
        idx = rand()%ps->hit_ratio_array_len;
        if (ratio > 1) {
            if (ps->hit_ratio_array[idx] == 0) {
                count --;
                ps->hit_ratio_array[idx] = 1;
            }
        } else {
            if (ps->hit_ratio_array[idx] == 1) {
                count --;
                ps->hit_ratio_array[idx] = 0;
            }
        }
    }

    return ps;
}

/* Destroy a produce scheme: pops PRODUCE_KEY_CACHE_POOL_COUNT entries
 * from ps->kcps (destroying each non-NULL pool), destroys the array,
 * then frees the hit ratio array and the scheme itself.
 * `ps` must not be NULL. */
static void produce_scheme_destroy(produce_scheme *ps)
{
    if (ps->kcps != NULL) {
        int remaining = PRODUCE_KEY_CACHE_POOL_COUNT;

        while (remaining > 0) {
            key_cache_array **slot = darray_pop(ps->kcps);
            if (*slot != NULL) {
                key_cache_array_destroy(*slot);
            }
            remaining --;
        }
        darray_destroy(ps->kcps);
    }

    free(ps->hit_ratio_array);
    free(ps);
}

/* Map a single TEST_CMD_TYPE_* value to the index of its key cache pool:
 * STRING -> 0, LIST -> 1, SET -> 2, ZSET -> 3, HASH -> 4.
 * Any other value yields (unsigned int)-1. */
static unsigned int get_kcp_idx(int type)
{
    switch(type)
    {
    case TEST_CMD_TYPE_STRING: return 0;
    case TEST_CMD_TYPE_LIST:   return 1;
    case TEST_CMD_TYPE_SET:    return 2;
    case TEST_CMD_TYPE_ZSET:   return 3;
    case TEST_CMD_TYPE_HASH:   return 4;
    default:                   break;
    }

    return (unsigned int)-1;
}

/* For every data type enabled in cmd_type (checked in the order STRING,
 * LIST, SET, ZSET, HASH), append that type's pool index to
 * non_empty_kcps_idx[] and bump non_empty_kcps_count.
 * The counter is not reset here, so entries are appended to whatever
 * is already recorded. */
static void set_non_empty_kcps_idx(void)
{
    static const int ordered_types[] = {
        TEST_CMD_TYPE_STRING,
        TEST_CMD_TYPE_LIST,
        TEST_CMD_TYPE_SET,
        TEST_CMD_TYPE_ZSET,
        TEST_CMD_TYPE_HASH
    };
    unsigned int n;

    for (n = 0; n < sizeof(ordered_types)/sizeof(ordered_types[0]); n ++) {
        if (!(cmd_type&ordered_types[n])) continue;

        non_empty_kcps_idx[non_empty_kcps_count++] =
            get_kcp_idx(ordered_types[n]);
    }
}

/* Get a key cache pool from the produce scheme.
 *
 * For a TEST_CMD_TYPE_KEY producer the pool is picked at random among
 * the indexes recorded in non_empty_kcps_idx[]; for every other producer
 * the pool is the one get_kcp_idx() maps dp->cmd_type to.
 *
 * Returns NULL when ps, ps->kcps or dp is NULL, when no pool index is
 * recorded for a KEY producer, or when the resulting index is not below
 * PRODUCE_KEY_CACHE_POOL_COUNT (this includes the (unsigned int)-1 that
 * get_kcp_idx() returns for unknown types). */
key_cache_array *kcp_get_from_ps(produce_scheme *ps, data_producer *dp)
{
    unsigned int idx;
    key_cache_array **kcp;

    if (ps == NULL || ps->kcps == NULL || dp == NULL) return NULL;

    if (dp->cmd_type == TEST_CMD_TYPE_KEY) {
        if (non_empty_kcps_count==0) {
            return NULL;
        }
        idx = rand()%non_empty_kcps_count;
        idx = non_empty_kcps_idx[idx];
    } else {
        idx = get_kcp_idx(dp->cmd_type);
    }

    /* idx is unsigned: a single upper-bound test also rejects "-1". */
    if (idx >= PRODUCE_KEY_CACHE_POOL_COUNT) {
        return NULL;
    }

    kcp = darray_get(ps->kcps, idx);

    return *kcp;
}

static int vrt_produce_threads_init(unsigned int produce_threads_count, 
    long long cached_keys, int hit_ratio)
{
    unsigned int idx;
    darray_init(&produce_threads, produce_threads_count, sizeof(produce_thread));
    produce_data_threads_count = produce_threads_count;
    for (idx = 0; idx < produce_threads_count; idx ++) {
        produce_thread *pt = darray_push(&produce_threads);
        pt->id = idx;
        pt->thread_id = 0;
        pt->ps = produce_scheme_create(cached_keys, hit_ratio);
        pt->pause = 0;
        pt->looptimes = 0;
    }
    
    return VRT_OK;
}

/* Pop every entry from produce_threads, destroying the produce scheme
 * of each entry that has one, then deinitialize the array. */
static void vrt_produce_threads_deinit(void)
{
    while (darray_n(&produce_threads) > 0) {
        produce_thread *worker = darray_pop(&produce_threads);

        if (worker->ps == NULL) continue;

        produce_scheme_destroy(worker->ps);
        worker->ps = NULL;
    }

    darray_deinit(&produce_threads);
}

/* Thread entry point of a produce thread; `args` is its produce_thread.
 *
 * Loops forever:
 *  - while paused, sleeps one second per iteration and resumes once
 *    test_if_need_pause() is false;
 *  - otherwise, every 10000th iteration asks test_if_need_pause() and,
 *    if a pause is needed, marks itself paused and reports it through
 *    one_produce_thread_paused();
 *  - picks a random producer from needed_cmd_type_producer, produces a
 *    data unit and hands it to data_dispatch(). A result of -1 releases
 *    the unit here; a result of 1 makes the thread sleep 100 ms.
 * looptimes is only advanced by iterations that produced a unit. */
static void *vrt_produce_thread_run(void *args)
{
    produce_thread *self = args;

    srand(vrt_usec_now()^(int)pthread_self());

    for (;;) {
        data_producer **slot;
        data_unit *unit;
        unsigned int pick;
        int status;

        /* At begin of this loop */
        if (self->pause) {
            usleep(1000000);    /* sleep 1 second */
            if (test_if_need_pause()) {
                continue;
            }
            self->pause = 0;
        } else if (self->looptimes%10000 == 0 && test_if_need_pause()) {
            self->pause = 1;
            one_produce_thread_paused();
            continue;
        }

        pick = rand()%needed_cmd_type_producer_count;
        slot = darray_get(&needed_cmd_type_producer,pick);
        unit = (*slot)->proc(*slot,self->ps);

        unit->data = self->ps;

        /* Dispatch the test data */
        status = data_dispatch(unit);
        if (status == -1) {
            data_unit_put(unit);
        } else if (status == 1) {
            usleep(100000);
        }

        self->looptimes ++;
    }

    return NULL;
}

/* Append `dp` to the needed_cmd_type_producer array and bump
 * needed_cmd_type_producer_count.
 * Returns VRT_OK on success, VRT_ERROR when the array cannot provide a
 * new slot (nothing is modified in that case). */
static int add_to_needed_cmd_type_producer(data_producer *dp)
{
    data_producer **dp_elem = darray_push(&needed_cmd_type_producer);

    if (dp_elem == NULL) {
        return VRT_ERROR;
    }

    *dp_elem = dp;
    needed_cmd_type_producer_count ++;

    return VRT_OK;
}

int vrt_produce_data_init(int key_length_range_min,int key_length_range_max, 
    int string_max_length,int fields_max_count,
    int produce_cmd_types,darray *produce_cmd_blacklist,darray *produce_cmd_whitelist,
    unsigned int produce_threads_count,long long cached_keys,
    int hit_ratio)
{
    int j, k;
    
    key_length_min = key_length_range_min;
    key_length_max = key_length_range_max;
    if (key_length_max < key_length_min) return VRT_ERROR;
    key_length_range_gap = key_length_max-key_length_min;
    field_length_max = fields_max_count;
    string_length_max = string_max_length;
    cmd_type = produce_cmd_types;
    darray_init(&needed_cmd_type_producer, 100, sizeof(data_producer*));

    producers_count = sizeof(redis_data_producer_table)/sizeof(data_producer);
    for (j = 0; j < producers_count; j++) {
        data_producer *dp = redis_data_producer_table+j;
        char *f = dp->sflags;

        while(*f != '\0') {
            switch(*f) {
            case 'w': dp->flags |= PRO_WRITE; break;
            case 'r': dp->flags |= PRO_READONLY; break;
            case 'm': dp->flags |= PRO_DENYOOM; break;
            case 'a': dp->flags |= PRO_ADMIN; break;
            case 'p': dp->flags |= PRO_PUBSUB; break;
            case 's': dp->flags |= PRO_NOSCRIPT; break;
            case 'R': dp->flags |= PRO_RANDOM; break;
            case 'S': dp->flags |= PRO_SORT_FOR_SCRIPT; break;
            case 'l': dp->flags |= PRO_LOADING; break;
            case 't': dp->flags |= PRO_STALE; break;
            case 'M': dp->flags |= PRO_SKIP_MONITOR; break;
            case 'k': dp->flags |= PRO_ASKING; break;
            case 'F': dp->flags |= PRO_FAST; break;
            case 'A': dp->flags |= PRO_ADD; break;
            default: return VRT_ERROR;
            }
            f++;
        }

        if (delete_data_producer == NULL && 
            !strcmp(dp->name,"del")) {
            delete_data_producer = dp;
        }

        if (produce_cmd_whitelist != NULL) {
            for (k = 0; k < darray_n(produce_cmd_whitelist); k ++) {
                sds *cmdname = darray_get(produce_cmd_whitelist, k);
                if (!strcasecmp(dp->name,*cmdname)) {
                    add_to_needed_cmd_type_producer(dp);
                    break;
                }
            }
            continue;
        }

        /* Check if this is in the blacklist */
        if (produce_cmd_blacklist != NULL) {
            int is_in_blacklist = 0;
            for (k = 0; k < darray_n(produce_cmd_blacklist); k ++) {
                sds *cmdname = darray_get(produce_cmd_blacklist, k);
                if (!strcasecmp(dp->name,*cmdname)) {
                    is_in_blacklist = 1;
                    break;
                }
            }
            
            if (is_in_blacklist) {
                continue;
            }
        }

        /* Add the needed command producer */
        if (dp->cmd_type&cmd_type) {
            add_to_needed_cmd_type_producer(dp);
        }
        if (dp->cmd_type&TEST_CMD_TYPE_EXPIRE && expire_enabled) {
            add_to_needed_cmd_type_producer(dp);
        }
    }

    set_non_empty_kcps_idx();

    if (darray_n(&needed_cmd_type_producer) == 0) {
        log_error("No command need to test");
        return VRT_ERROR;
    }

    if (delete_data_producer == NULL) {
        return VRT_ERROR;
    }
    
    if (needed_cmd_type_producer_count == 0) {
        return VRT_ERROR;
    }

    for (j = 0; j < needed_cmd_type_producer_count; j ++) {
        data_producer **dp_elem = darray_get(&needed_cmd_type_producer,j);
        log_debug(LOG_INFO, "needed test command[%d]: %s", j, (*dp_elem)->name);
    }

    vrt_produce_threads_init(produce_threads_count, cached_keys, hit_ratio);
    
    return VRT_OK;
}

void vrt_produce_data_deinit(void)
{
    vrt_produce_threads_deinit();

    needed_cmd_type_producer.nelem = 0;
    darray_deinit(&needed_cmd_type_producer);
}

int vrt_start_produce_data(void)
{
    unsigned int i;
    for (i = 0; i < darray_n(&produce_threads); i ++) {
        pthread_attr_t attr;
        produce_thread *pt;
        pthread_attr_init(&attr);
        pt = darray_get(&produce_threads, i);
        pthread_create(&pt->thread_id, 
            &attr, vrt_produce_thread_run, pt);
    }
    
    last_test_begin_time = vrt_sec_now();
    return VRT_OK;
}

/* Join every thread recorded in produce_threads, in array order.
 * The result of pthread_join() is not inspected.
 * Always returns VRT_OK. */
int vrt_wait_produce_data(void)
{
    unsigned int joined = 0;

    /* wait for the produce threads finish */
    while (joined < darray_n(&produce_threads)) {
        produce_thread *worker = darray_get(&produce_threads, joined);
        pthread_join(worker->thread_id, NULL);
        joined ++;
    }

    return VRT_OK;
}

/* -----------------------------------------------------------------------------
 * API to get key arguments from data producers
 * ---------------------------------------------------------------------------*/

/* The base case is to use the keys position as given in the data producer table
 * (firstkey, lastkey, step).
 *
 * A negative lastkey is taken relative to argc (-1 is the last argument).
 * Returns a malloc'ed array with the positions firstkey, firstkey+keystep,
 * ... up to lastkey and stores its length in *numkeys; the caller frees
 * it. Returns NULL with *numkeys set to 0 when the producer has no keys
 * (firstkey == 0), when the range is empty, when keystep is not
 * positive, or when the allocation fails. `argv` is not inspected. */
static int *get_keys_using_data_producer_table(data_producer *dp,sds *argv, int argc, int *numkeys) {
    int j, i = 0, last, *keys;

    (void)argv;
    *numkeys = 0;

    if (dp->firstkey == 0) {
        return NULL;
    }
    last = dp->lastkey;
    if (last < 0) last = argc+last;

    /* An empty range would give a zero or negative element count, and a
     * non-positive step would never terminate the loop below. */
    if (last < dp->firstkey || dp->keystep <= 0) {
        return NULL;
    }

    keys = malloc(sizeof(int)*((last - dp->firstkey)+1));
    if (keys == NULL) {
        return NULL;
    }
    for (j = dp->firstkey; j <= last; j += dp->keystep) {
        keys[i++] = j;
    }
    *numkeys = i;
    return keys;
}

/* Return the positions of all key arguments of the command in argv/argc.
 *
 * The result is a heap allocated array of argv indexes whose length is
 * stored in *numkeys.
 *
 * 'dp' is the data producer entry the command was produced by. When it
 * has a producer-specific getkeys_proc that function is called;
 * otherwise the positions are derived from the entry's firstkey,
 * lastkey and keystep values. */
int *get_keys_from_data_producer(data_producer *dp, sds *argv, int argc, int *numkeys) {
    if (dp->getkeys_proc == NULL) {
        return get_keys_using_data_producer_table(dp,argv,argc,numkeys);
    }

    return dp->getkeys_proc(dp,argv,argc,numkeys);
}

/* Return the first key argument of the command held by `du`.
 *
 * The returned sds is the element stored in du->argv itself, not a
 * copy, so it must not be freed separately from the unit.
 * Returns NULL (after NOT_REACHED()) when no key position can be
 * determined for the command. */
sds get_one_key_from_data_unit(data_unit *du)
{
    int numkeys = 0;
    int *keyindex;
    sds key;

    keyindex = get_keys_from_data_producer(du->dp,du->argv,du->argc,&numkeys);
    if (keyindex == NULL || numkeys <= 0) {
        /* Release the index array first so this path does not leak it. */
        free(keyindex);
        NOT_REACHED();
        return NULL;
    }

    key = du->argv[keyindex[0]];
    free(keyindex);

    return key;
}

/* Write the command held by `du` to the log as one line: every argument
 * followed by a single space, then a newline. */
void print_producer_command(data_unit *du)
{
    sds line = sdsempty();
    int pos = 0;

    while (pos < du->argc) {
        line = sdscatsds(line,du->argv[pos]);
        line = sdscat(line," ");
        pos ++;
    }
    line = sdscat(line,"\n");

    log_write_len(line,sdslen(line));
    sdsfree(line);
}


================================================
FILE: tests/vrt_produce_data.h
================================================
#ifndef _VRT_PRODUCE_DATA_H_
#define _VRT_PRODUCE_DATA_H_

/* Producer flags. Please check the producer table defined in the vrt_produce_data.c file
 * for more information about the meaning of every flag.
 * This is the meaning of the flags:
 *
 * w: write command (may modify the key space).
 * r: read command  (will never modify the key space).
 * m: may increase memory usage once called. Don't allow if out of memory.
 * a: admin command, like SAVE or SHUTDOWN.
 * p: Pub/Sub related command.
 * f: force replication of this command, regardless of server.dirty.
 * s: command not allowed in scripts.
 * R: random command. Command is not deterministic, that is, the same command
 *    with the same arguments, with the same key space, may have different
 *    results. For instance SPOP and RANDOMKEY are two random commands.
 * S: Sort command output array if called from script, so that the output
 *    is deterministic.
 * l: Allow command while loading the database.
 * t: Allow command while a slave has stale data but is not allowed to
 *    serve this data. Normally no command is accepted in this condition
 *    but just a few.
 * M: Do not automatically propagate the command on MONITOR.
 * k: Perform an implicit ASKING for this command, so the command will be
 *    accepted in cluster mode if the slot is marked as 'importing'.
 * F: Fast command: O(1) or O(log(N)) command that should never delay
 *    its execution as long as the kernel scheduler is giving us time.
 *    Note that commands that may trigger a DEL as a side effect (like SET)
 *    are not fast commands.
 * A: Add a new key if the key did not exist before.
 */

/* Producer flag bits; one bit per character of the 'sflags' string. */
#define PRO_WRITE           (1<<0)    /* "w" flag */
#define PRO_READONLY        (1<<1)    /* "r" flag */
#define PRO_DENYOOM         (1<<2)    /* "m" flag */
#define PRO_NOT_USED_1      (1<<3)    /* no longer used flag */
#define PRO_ADMIN           (1<<4)    /* "a" flag */
#define PRO_PUBSUB          (1<<5)    /* "p" flag */
#define PRO_NOSCRIPT        (1<<6)    /* "s" flag */
#define PRO_RANDOM          (1<<7)    /* "R" flag */
#define PRO_SORT_FOR_SCRIPT (1<<8)    /* "S" flag */
#define PRO_LOADING         (1<<9)    /* "l" flag */
#define PRO_STALE           (1<<10)   /* "t" flag */
#define PRO_SKIP_MONITOR    (1<<11)   /* "M" flag */
#define PRO_ASKING          (1<<12)   /* "k" flag */
#define PRO_FAST            (1<<13)   /* "F" flag */
#define PRO_ADD             (1<<14)   /* "A" flag */

/* Forward declarations so the callback typedefs below can refer to these
 * structures by pointer. */
struct data_producer;
struct produce_scheme;
struct key_cache_array;

/* Callback that takes a producer entry and a produce scheme and returns a
 * pointer to a data_unit. */
typedef struct data_unit *redis_command_proc(struct data_producer *dp, struct produce_scheme *ps);
/* Callback that returns an array of argv positions holding keys and stores
 * the number of positions into *numkeys. */
typedef int *redis_get_keys_proc(struct data_producer *dp, sds *argv, int argc, int *numkeys);
/* Callback that inspects a reply and returns an int.
 * NOTE(review): presumably non-zero means the key should be cached - confirm. */
typedef int produce_need_cache_key_proc(struct redisReply *reply);
/* One entry of the producer table: describes a command the test tool can
 * generate and where the keys are located inside such a command. */
typedef struct data_producer {
    char *name;     /* Command name */
    redis_command_proc *proc;   /* Callback returning a data_unit for this command */
    int arity;      /* NOTE(review): presumably the argument count as in the redis command table - confirm */
    
    char *sflags; /* Flags as string representation, one char per flag. */
    int flags;    /* The actual flags, obtained from the 'sflags' field. */
    
    /* Use a function to determine keys arguments in a command line.
     * When NULL, firstkey/lastkey/keystep below are used instead. */
    redis_get_keys_proc *getkeys_proc;
    /* What keys should be loaded in background when calling this command? */
    int firstkey; /* The first argument that's a key (0 = no keys) */
    int lastkey;  /* The last argument that's a key; a negative value counts from the end of argv */
    int keystep;  /* The step between first and last key */
    int cmd_type; /* NOTE(review): presumably one of the TEST_CMD_TYPE_* values - confirm */
    produce_need_cache_key_proc *need_cache_key_proc; /* Callback that inspects a reply for this command */
} data_producer;

/* One generated command together with the producer entry it came from. */
typedef struct data_unit {
    data_producer *dp;  /* Producer entry used to locate the keys of this command. */
    int argc;       /* Num of arguments of current command. */
    sds *argv;    /* Arguments of current command. */
    
    unsigned int hashvalue; /* NOTE(review): presumably a hash of the command's key - confirm */

    void *data;     /* Opaque pointer; its meaning is not visible in this header. */
} data_unit;

/* Settings that control which keys the generated commands use. */
typedef struct produce_scheme {
    darray *kcps;   /* Key cached pools for every type command. */

    int hit_ratio;   /* Hit ratio for the read commands. [0%,100%] */
    int hit_ratio_idx;   /* [0,hit_ratio_array_len-1] */
    int hit_ratio_array_len; /* 100 usually */
    int *hit_ratio_array;    /* Stored 0 or 1 for every element, 1 means used key in the cached keys array. */
} produce_scheme;

/* NOTE(review): presumably the producer entry for the delete command - confirm. */
extern data_producer *delete_data_producer;

/* NOTE(review): presumably the number of producer threads - confirm. */
extern int produce_data_threads_count;

/* NOTE(review): presumably counts producer threads that finished pausing - confirm. */
extern int produce_threads_pause_finished_count;

/* Returns a key cache array for the given scheme and producer entry. */
struct key_cache_array *kcp_get_from_ps(produce_scheme *ps, data_producer *dp);

/* Obtain / give back a data_unit.
 * NOTE(review): whether these allocate or recycle is not visible here. */
data_unit *data_unit_get(void);
void data_unit_put(data_unit *du);

/* Set up and tear down the data production module. */
int vrt_produce_data_init(int key_length_range_min, int key_length_range_max, 
    int string_max_length,int fields_max_count,
    int produce_cmd_types,darray *produce_cmd_blacklist,darray *produce_cmd_whitelist,
    unsigned int produce_threads_count, long long cached_keys,
    int hit_ratio);
void vrt_produce_data_deinit(void);

/* Start data production / wait for it. */
int vrt_start_produce_data(void);
int vrt_wait_produce_data(void);

/* Returns a heap allocated array with the argv positions of the keys of a
 * command; the number of positions is stored into *numkeys. */
int *get_keys_from_data_producer(data_producer *dp, sds *argv, int argc, int *numkeys);

/* Returns the first key argument of the command held by 'du'; the value is
 * the argv element itself, not a copy. */
sds get_one_key_from_data_unit(data_unit *du);

/* Writes the command held by 'du' to the log as a single line. */
void print_producer_command(data_unit *du);

#endif


================================================
FILE: tests/vrt_public.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <getopt.h>
#include <fcntl.h>
#include <errno.h>
#include <signal.h>
#include <pthread.h>
#include <unistd.h>
#include <sys/stat.h>
#include <sys/types.h>
#include <sys/utsname.h>
#include <sys/wait.h>

#include <hiredis.h>

#include <darray.h>
#include <dlog.h>

#include <vrt_util.h>
#include <vrt_public.h>

/* The mutex below is only defined when neither of the two atomic builtin
 * families is available; the header declares it extern in that same case. */
/* GCC version >= 4.7 */
#if defined(__ATOMIC_RELAXED)
/* GCC version >= 4.1 */
#elif defined(HAVE_ATOMIC)
#else
pthread_mutex_t state_locker = PTHREAD_MUTEX_INITIALIZER;
#endif

/* Default path of the vire binary passed to execl(). */
#define VIRE_TEST_CONFIG_DEFAULT_EXECUTE_FILE "src/vire"

/* Path of the vire binary to launch; replaced by set_execute_file(). */
static char *execute_file = VIRE_TEST_CONFIG_DEFAULT_EXECUTE_FILE;

/* Absolute path of the temporary work directory; NULL until
 * create_work_dir() runs and again after destroy_work_dir(). */
static sds workdir = NULL;

static int vireport = 55556; /* The available port for vire to start */

/* Replace the path of the vire binary that vire_server_run() executes.
 * The pointer is stored as-is (no copy is made), so the string must stay
 * valid for as long as servers may be started. */
void set_execute_file(char *file)
{
    execute_file = file;
}

/* Create the file "<dir>/vire.conf" holding the line "port <port>" followed
 * by an empty line.
 *
 * Returns the path of the configuration file as a new sds string that the
 * caller must free with sdsfree(), or NULL if the file could not be opened
 * or written completely. */
static sds vire_conf_create(char *dir, int port)
{
    sds conf_file;
    sds content;
    size_t len, done = 0;
    ssize_t nwritten;
    int fd;
    
    conf_file = sdscatfmt(sdsempty(),"%s/vire.conf",dir);

    fd = open(conf_file,O_WRONLY|O_CREAT|O_TRUNC,0644);
    if (fd < 0) {
        test_log_error("Open conf file %s failed: %s", conf_file, strerror(errno));
        sdsfree(conf_file);
        return NULL;
    }

    content = sdscatfmt(sdsempty(),"port %i\n\n",port);
    len = sdslen(content);

    /* write() may store fewer bytes than requested; loop until all of the
     * content is on disk or a real error shows up. */
    while (done < len) {
        nwritten = write(fd, content+done, len-done);
        if (nwritten < 0) {
            if (errno == EINTR) continue;
            test_log_error("Write conf file %s failed: %s", conf_file, strerror(errno));
            close(fd);
            sdsfree(content);
            sdsfree(conf_file);
            return NULL;
        }
        done += (size_t)nwritten;
    }

    close(fd);
    sdsfree(content);
    return conf_file;
}

/* Allocate the bookkeeping for one vire server that will listen on 'port'.
 *
 * A directory "<workdir>/<port>" is created, a configuration file is
 * written into it, and the pid/log file paths are prepared. The server
 * itself is not started here.
 *
 * Returns the new instance, to be released with vire_instance_destroy(),
 * or NULL on failure. */
vire_instance *vire_instance_create(int port)
{
    vire_instance *vi;

    if (workdir == NULL) {
        test_log_error("Work dir is not created yet");
        return NULL;
    }

    vi = malloc(sizeof(*vi));
    if (vi == NULL) {
        test_log_error("Out of memory when create vire instance for port %d", port);
        return NULL;
    }

    vi->host = NULL;
    vi->port = 0;
    vi->dir = NULL;
    vi->conf_file = NULL;
    vi->pid_file = NULL;
    vi->log_file = NULL;
    vi->running = 0;
    vi->pid = -1;
    vi->ctx = NULL;

    vi->host = sdsnew("127.0.0.1");
    vi->port = port;
    vi->dir = sdscatfmt(sdsempty(),"%s/%i",workdir,port);

    if (mkdir(vi->dir,0755) < 0) {
        test_log_error("Create dir %s failed: %s", vi->dir, strerror(errno));
        /* Drop the path first: the destroy function removes vi->dir from
         * disk, and this call did not create that directory. */
        sdsfree(vi->dir);
        vi->dir = NULL;
        vire_instance_destroy(vi);
        return NULL;
    }

    vi->conf_file = vire_conf_create(vi->dir, port);
    if (vi->conf_file == NULL) {
        vire_instance_destroy(vi);
        return NULL;
    }

    vi->pid_file = sdscatfmt(sdsempty(),"%s/vire.pid",vi->dir);
    vi->log_file = sdscatfmt(sdsempty(),"%s/vire.log",vi->dir);

    test_log_debug("vire host: %s", vi->host);
    test_log_debug("vire port: %d", vi->port);
    test_log_debug("vire dir: %s", vi->dir);
    test_log_debug("vire conf_file: %s", vi->conf_file);
    test_log_debug("vire pid_file: %s", vi->pid_file);
    test_log_debug("vire log_file: %s", vi->log_file);

    return vi;
}

/* Release everything owned by 'vi': stop the server if it is marked as
 * running, remove the instance directory, free all strings and the redis
 * connection, and finally free the structure itself. */
void vire_instance_destroy(vire_instance *vi)
{
    /* The server goes down before its directory is removed. */
    if (vi->running) vire_server_stop(vi);

    if (vi->dir != NULL) {
        destroy_dir(vi->dir);
        sdsfree(vi->dir);
    }

    if (vi->conf_file != NULL) sdsfree(vi->conf_file);
    if (vi->pid_file != NULL) sdsfree(vi->pid_file);
    if (vi->log_file != NULL) sdsfree(vi->log_file);

    if (vi->ctx != NULL) redisFree(vi->ctx);

    if (vi->host != NULL) sdsfree(vi->host);

    free(vi);
}

/* Start the vire server described by 'vi' as a child process and connect
 * to it.
 *
 * The child executes the configured vire binary with the instance's conf,
 * pid and log files. After one second the parent checks that the child is
 * still alive, connects to it and verifies that the pid reported by the
 * server matches the forked child.
 *
 * Returns VRT_OK with vi->running set to 1 on success. On failure returns
 * VRT_ERROR; a child that is still alive at that point is killed and
 * reaped so that no stray server is left behind. */
int vire_server_run(vire_instance *vi)
{
    pid_t pid;
    struct timeval timeout = { 3, 500000 }; /* 3.5 seconds */
    
    pid = fork();
    if (pid < 0) {
        test_log_error("Fork a chind failed: %s", strerror(errno));
        return VRT_ERROR;
    }

    if (pid == 0) {
        /* Child: execl() only returns when it failed. */
        execl(execute_file,"vire","-c",vi->conf_file,
            "-p",vi->pid_file,"-o",vi->log_file,"-v","8",(char *)NULL);
        test_log_error("Execl the vire server failed: %s", strerror(errno));
        /* Leave right away: returning would let the child continue running
         * the test harness code as a second copy of the parent. */
        _exit(127);
    }

    sleep(1);

    /* A non-zero result means the child already exited (or waitpid failed). */
    if (waitpid(pid,NULL,WNOHANG) != 0) {
        test_log_debug("Run vire server(port %d) failed",vi->port);
        return VRT_ERROR;
    }

    vi->ctx = redisConnectWithTimeout(vi->host,vi->port,timeout);
    if (vi->ctx == NULL || vi->ctx->err) {
        test_log_error("Connect to %s:%d failed: %s", 
            vi->host, vi->port, vi->ctx?vi->ctx->errstr:"out of memory");
        goto failed;
    }

    vi->pid = get_pid_from_reply(vi->ctx,vi->host,vi->port);
    if (vi->pid < 0) {
        test_log_error("Get pid from %s:%d reply error", vi->host, vi->port);
        goto failed;
    } else if (vi->pid != pid) {
        test_log_error("Get wrong pid from %s:%d reply", vi->host, vi->port);
        goto failed;
    }

    test_log_debug("Run vire server(port %d) success",vi->port);

    vi->running = 1;

    return VRT_OK;

failed:
    if (vi->ctx) {
        redisFree(vi->ctx);
        vi->ctx = NULL;
    }
    vi->pid = -1;

    /* vi->running is still 0, so nobody else would stop this child. */
    kill(pid,SIGKILL);
    waitpid(pid,NULL,0);

    return VRT_ERROR;
}

/* Stop the server of 'vi' by sending it SIGKILL.
 *
 * The pid is taken from vi->pid when known, otherwise from the pid file,
 * otherwise it is asked from the server over the existing connection.
 * On success the instance is marked as not running and its connection is
 * released. Nothing happens when the instance is not marked as running. */
void vire_server_stop(vire_instance *vi)
{
    long pid;

    if (!vi->running) return;

    if (vi->pid > 0) {
        pid = vi->pid;
    } else if (vi->pid_file) {
        int fd;
        char pid_str[20];
        ssize_t nread;

        fd = open(vi->pid_file, O_RDONLY);
        if (fd < 0) {
            test_log_error("Open pid file %s failed", vi->pid_file);
            return;
        }
        nread = read(fd,pid_str,sizeof(pid_str));
        close(fd);
        if (nread <= 0) {
            test_log_error("Read pid file %s failed", vi->pid_file);
            return;
        }

        /* Ignore trailing line breaks and blanks after the number. */
        while (nread > 0 && (pid_str[nread-1] == '\n' ||
            pid_str[nread-1] == '\r' || pid_str[nread-1] == ' ')) {
            nread--;
        }

        if (string2l(pid_str,(size_t)nread,&pid) == 0) {
            test_log_error("Convert pid string %.*s to long failed",(int)nread,pid_str);
            return;
        }
    } else {
        pid = get_pid_from_reply(vi->ctx, vi->host, vi->port);
    }

    /* pid 0 must be rejected too: kill(0, ...) would signal the whole
     * process group, including this test program. */
    if (pid <= 0) {
        test_log_error("Get pid failed");
        return;
    }

    kill((pid_t)pid,SIGKILL);
    /* Reap the child so it does not stay around as a zombie; this simply
     * fails when the process is not a child of the caller. */
    waitpid((pid_t)pid,NULL,0);

    vi->running = 0;
    vi->pid = -1;
    if (vi->ctx) {
        redisFree(vi->ctx);
        vi->ctx = NULL;
    }
}

int create_work_dir(void)
{
    sds dirname;
    dirname = sdscatfmt(sdsempty(), "tmp_test_%I", vrt_usec_now());
    workdir = getAbsolutePath(dirname);
    sdsfree(dirname);

    if (create_dir(workdir) != VRT_OK) {
        test_log_error("Create workdir %s failed",workdir);
        return VRT_ERROR;
    }

    test_log_debug("Create workdir: %s",workdir);
    
    return VRT_OK;
}

/* Remove the work directory, if one was recorded, and forget its path.
 * A failed removal is only logged; the function always returns VRT_OK. */
int destroy_work_dir(void)
{
    if (workdir != NULL) {
        if (destroy_dir(workdir) == VRT_OK) {
            test_log_debug("Delete the workdir: %s",workdir);
        } else {
            test_log_error("Delete the workdir %s failed",workdir);
        }

        sdsfree(workdir);
        workdir = NULL;
    }

    return VRT_OK;
}

/* Hand out the current candidate port and move the candidate forward by
 * 11 for the next caller. */
static int get_next_port(void)
{
    int current = vireport;

    vireport = current + 11;
    return current;
}

/* Create a vire instance and start its server, using a fresh port for each
 * attempt. After the first attempt up to 10 more are made; every failed
 * instance is destroyed before the next one is created.
 *
 * Returns the running instance, or NULL when an instance could not be
 * created or every attempt to run the server failed. */
vire_instance *start_one_vire_instance(void)
{
    int retries_left = 10;
    vire_instance *vi;

    for (;;) {
        vi = vire_instance_create(get_next_port());
        if (vi == NULL) {
            return NULL;
        }

        if (vire_server_run(vi) == VRT_OK) {
            return vi;
        }

        /* This attempt failed: clean up, then retry if the budget allows. */
        vire_instance_destroy(vi);
        if (retries_left-- == 0) {
            return NULL;
        }
    }
}

/* Print the outcome of one test case.
 *
 * VRT_TEST_OK prints a green "OK" tag with the test description;
 * VRT_TEST_ERR prints a red "ERR" tag, the description and the failure
 * cause, where a NULL or empty 'errmsg' is shown as "unknown". Any other
 * 'result' value prints nothing. */
void show_test_result(int result,char *test_content,char *errmsg)
{
    char *cause;

    switch (result) {
    case VRT_TEST_OK:
        test_log_out("[\033[32mOK\033[0m]: %s", test_content);
        break;
    case VRT_TEST_ERR:
        cause = "unknown";
        if (errmsg != NULL && errmsg[0] != '\0') {
            cause = errmsg;
        }
        test_log_out("[\033[31mERR\033[0m]: %s, \033[33mfail cause: %s\033[0m", test_content, 
            cause);
        break;
    default:
        break;
    }
}

/************** Key cache pool implement start *************/
/* Create a key cache able to hold 'max_pool_size' keys. Every slot starts
 * out as an empty sds string.
 *
 * Returns the new cache, to be released with key_cache_array_destroy(), or
 * NULL when 'max_pool_size' is below 10, does not fit into size_t, or
 * memory is exhausted. */
key_cache_array *key_cache_array_create(long long max_pool_size)
{
    long long idx;
    size_t nslots;
    key_cache_array *kca;

    /* It is too small */
    if (max_pool_size < 10) return NULL;

    /* Refuse sizes that would be truncated by the conversion to size_t. */
    nslots = (size_t)max_pool_size;
    if ((long long)nslots != max_pool_size) return NULL;

    kca = malloc(sizeof(*kca));
    if (kca == NULL) return NULL;

    kca->cached_keys_count = 0;
    kca->ckeys_write_idx = 0;
    kca->max_pool_size = max_pool_size;
    kca->ckeys = NULL;
    pthread_mutex_init(&kca->pmutex,NULL);

    /* calloc() checks the multiplication for overflow and leaves every
     * slot NULL, so a partially filled array can be destroyed safely. */
    kca->ckeys = calloc(nslots,sizeof(sds));
    if (kca->ckeys == NULL) {
        key_cache_array_destroy(kca);
        return NULL;
    }

    for (idx = 0; idx < max_pool_size; idx ++) {
        kca->ckeys[idx] = sdsempty();
        if (kca->ckeys[idx] == NULL) {
            key_cache_array_destroy(kca);
            return NULL;
        }
    }

    return kca;
}

/* Free a key cache: its mutex, every cached key string, the slot array and
 * the structure itself. A NULL 'kca' is ignored. */
void key_cache_array_destroy(key_cache_array *kca)
{
    long long pos = 0;

    if (kca == NULL) return;

    pthread_mutex_destroy(&kca->pmutex);

    if (kca->ckeys != NULL) {
        while (pos < kca->max_pool_size) {
            sdsfree(kca->ckeys[pos]);
            pos++;
        }
        free(kca->ckeys);
    }

    free(kca);
}

/* Store a copy of 'key' ('keylen' bytes) in the slot at the write index,
 * replacing whatever that slot held. The write index then advances and
 * wraps to 0 at max_pool_size; the cached key count grows until it reaches
 * max_pool_size. The whole update happens under the cache mutex.
 *
 * Returns VRT_OK, or VRT_ERROR when 'kca' or 'key' is NULL or 'keylen' is 0. */
int key_cache_array_input(key_cache_array *kca, char *key, size_t keylen)
{
    sds *slot;

    if (!kca || !key || !keylen) return VRT_ERROR;

    pthread_mutex_lock(&kca->pmutex);

    slot = &kca->ckeys[kca->ckeys_write_idx];
    *slot = sdscpylen(*slot,key,keylen);

    if (++kca->ckeys_write_idx >= kca->max_pool_size) {
        kca->ckeys_write_idx = 0;
    }

    if (kca->cached_keys_count < kca->max_pool_size) {
        kca->cached_keys_count++;
    }

    pthread_mutex_unlock(&kca->pmutex);

    return VRT_OK;
}

/* Return a copy of a randomly chosen cached key.
 *
 * The index is rand() modulo the number of cached keys, and the slot is
 * read while holding the cache mutex. Returns a new sds string that the
 * caller must free, or NULL when 'kca' is NULL or no key is cached yet. */
sds key_cache_array_random(key_cache_array *kca)
{
    unsigned long long idx;
    unsigned int randomval;
    sds key;

    if (kca == NULL) {
        return NULL;
    }

    randomval = (unsigned int)rand();
    
    pthread_mutex_lock(&kca->pmutex);
    if (kca->cached_keys_count <= 0) {
        pthread_mutex_unlock(&kca->pmutex);
        return NULL;
    }

    /* Keep the full 64 bit count: narrowing it to unsigned int could turn
     * a non-zero count into 0 and make the modulo divide by zero. */
    idx = (unsigned long long)randomval%(unsigned long long)kca->cached_keys_count;

    key = sdsdup(kca->ckeys[idx]);
    pthread_mutex_unlock(&kca->pmutex);
    
    return key;
}

/************** Key cache pool implement end *************/

/* Extract the integer value of field 'name' from the reply of an 'info'
 * command.
 *
 * The reply text is split into lines at "\r\n"; the first line of the form
 * "<name>:<value>" is selected and <value> is parsed as a long long.
 *
 * Returns the parsed value, or -1 when the reply is not a string, the
 * field is missing, or its value is not a valid number. */
long long get_longlong_from_info_reply(redisReply *reply, char *name)
{
    sds *lines;
    size_t line_len, len;
    int count, j;
    long long value = -1;

    if (reply == NULL || name == NULL) {
        test_log_error("Reply or field name for 'info' command is NULL");
        return -1;
    }

    len = strlen(name);
    
    if (reply->type != REDIS_REPLY_STRING) {
        test_log_error("Reply for 'info' command from vire type %d is error",
            reply->type);
        return -1;
    }

    lines = sdssplitlen(reply->str,reply->len,"\r\n",2,&count);
    if (lines == NULL) {
        test_log_error("Reply for 'info server' command from vire is error");
        return -1;
    }

    for (j = 0; j < count; j ++) {
        line_len = sdslen(lines[j]);
        if (line_len <= len+1) continue;

        /* Require the ':' right after the name, so that a field whose name
         * merely starts with 'name' is not picked by mistake. */
        if (strncmp(name, lines[j], len) != 0 || lines[j][len] != ':') continue;

        if (string2ll(lines[j]+len+1,line_len-len-1,&value) == 0) {
            /* "%.*s" takes an int precision, not a size_t. */
            test_log_error("Convert value string %.*s to long long failed",
                (int)(line_len-len-1),lines[j]+len+1);
            sdsfreesplitres(lines,count);
            return -1;
        }
        break;
    }

    sdsfreesplitres(lines,count);
    return value;
}

/* Move the contents of 'r' into a newly allocated reply object.
 *
 * The type, integer, string and element fields are copied over, and the
 * string/element fields of 'r' are then cleared, so the payload is owned
 * by the returned reply only. Returns NULL (leaving 'r' untouched) when
 * the allocation fails. */
redisReply *steal_hiredis_redisreply(redisReply *r)
{
    redisReply *stolen = calloc(1,sizeof(*stolen));

    if (stolen != NULL) {
        /* Take over the payload... */
        stolen->type = r->type;
        stolen->integer = r->integer;
        stolen->len = r->len;
        stolen->str = r->str;
        stolen->elements = r->elements;
        stolen->element = r->element;

        /* ...and detach it from the source reply. */
        r->len = 0;
        r->str = NULL;
        r->elements = 0;
        r->element = NULL;
    }

    return stolen;
}

/* Compare two replies recursively.
 *
 * Returns 0 when the replies are the same and a non-zero value otherwise.
 * A NULL reply never equals anything (not even another NULL), and replies
 * of different types are always different. Strings, statuses and errors
 * are compared by length and bytes, arrays element by element, integers by
 * value; two nil replies are the same. An unknown reply type is logged and
 * treated as the same.
 *
 * The non-zero result is always produced from an explicit comparison and
 * never from a narrowed subtraction, so large differences cannot collapse
 * to 0. */
int check_two_replys_if_same(redisReply *reply1, redisReply *reply2)
{
    size_t j;

    if (reply1 == NULL || reply2 == NULL) {
        return 1;
    }
    
    if (reply1->type != reply2->type) {
        return 1;
    }

    switch (reply1->type) {
    case REDIS_REPLY_STRING:
    case REDIS_REPLY_STATUS:
    case REDIS_REPLY_ERROR:
        if (reply1->len != reply2->len) {
            return (reply1->len < reply2->len) ? -1 : 1;
        }
        /* Nothing to compare; also avoids memcmp() on a missing buffer. */
        if (reply1->len == 0) {
            return 0;
        }
        return memcmp(reply1->str, reply2->str, reply1->len);
    case REDIS_REPLY_ARRAY:
        if (reply1->elements != reply2->elements) {
            return (reply1->elements < reply2->elements) ? -1 : 1;
        }

        for (j = 0; j < reply1->elements; j ++) {
            int ret = check_two_replys_if_same(reply1->element[j], reply2->element[j]);
            if (ret != 0) return ret;
        }
        return 0;
    case REDIS_REPLY_INTEGER:
        if (reply1->integer == reply2->integer) {
            return 0;
        }
        return (reply1->integer < reply2->integer) ? -1 : 1;
    case REDIS_REPLY_NIL:
        return 0;
    default:
        test_log_error("reply type %d is error", reply1->type);
        break;
    }

    return 0;
}

/* One group of consecutive array elements that is moved as a whole while
 * sorting; the groups are ordered by a single field of each group. */
struct sort_unit {
    size_t nfield;      /* Number of entries in 'fields'. */
    void **fields;      /* The element pointers that belong to this group. */
    unsigned int idx_cmp;   /* Index inside 'fields' of the entry used for comparison. */
    int (*fcmp)(const void *,const void *); /* Comparator; receives pointers to the two compared entries. */
};

/* qsort() comparator for struct sort_unit: orders two groups by calling
 * the groups' comparator on the address of each group's idx_cmp-th field.
 * Both groups are expected to share the same comparator, field count and
 * comparison index. */
static int element_cmp_multi_step(const void *ele1,const void *ele2)
{
    struct sort_unit *lhs = (struct sort_unit *)ele1;
    struct sort_unit *rhs = (struct sort_unit *)ele2;
    void **lhs_field, **rhs_field;

    ASSERT(lhs->fcmp == rhs->fcmp);
    ASSERT(lhs->nfield == rhs->nfield);
    ASSERT(lhs->idx_cmp == rhs->idx_cmp);
    ASSERT(lhs->idx_cmp < lhs->nfield);

    lhs_field = &(lhs->fields[lhs->idx_cmp]);
    rhs_field = &(rhs->fields[rhs->idx_cmp]);

    return lhs->fcmp(lhs_field,rhs_field);
}

/* Sort an array of pointers in groups of 'step' consecutive elements.
 *
 * element  - the array; every element must be a pointer.
 * elements - number of elements in the array.
 * step     - group size. With step 1 the array is sorted directly.
 * idx_cmp  - index inside each group of the element the groups are ordered
 *            by; must be in [0,step) when step is greater than 1.
 * fcmp     - comparator in qsort() style; it receives the addresses of the
 *            two compared elements.
 *
 * Arrays with at most one element are left as they are. Returns VRT_OK on
 * success and VRT_ERROR when 'step' is not positive, 'elements' is not a
 * multiple of 'step', 'idx_cmp' is out of range, or memory is exhausted. */
int sort_array_by_step(void **element, size_t elements, 
    int step, int idx_cmp, int (*fcmp)(const void *,const void *))
{
    struct sort_unit *sus;
    void **fields;
    size_t count, width, j, k;

    if (elements <= 1)
        return VRT_OK;

    if (step <= 0)
        return VRT_ERROR;
    
    if (step == 1) {
        qsort(element, elements, sizeof(void *), fcmp);
        return VRT_OK;
    }

    width = (size_t)step;
    if (elements%width != 0)
        return VRT_ERROR;

    /* An index outside the group would read beyond the group's fields. */
    if (idx_cmp < 0 || idx_cmp >= step)
        return VRT_ERROR;

    count = elements/width;
    if (count == 0)
        return VRT_ERROR;

    /* One snapshot of the whole array backs the fields of every group. */
    sus = calloc(count,sizeof(*sus));
    fields = malloc(elements*sizeof(*fields));
    if (sus == NULL || fields == NULL) {
        free(sus);
        free(fields);
        return VRT_ERROR;
    }

    for (j = 0; j < elements; j ++) {
        fields[j] = element[j];
    }

    for (j = 0; j < count; j ++) {
        sus[j].nfield = width;
        sus[j].idx_cmp = (unsigned int)idx_cmp;
        sus[j].fcmp = fcmp;
        sus[j].fields = fields + j*width;
    }

    qsort(sus, count, sizeof(*sus), element_cmp_multi_step);

    /* Write the groups back in their sorted order. */
    for (j = 0; j < count; j ++) {
        for (k = 0; k < width; k ++) {
            element[j*width+k] = sus[j].fields[k];
        }
    }

    free(fields);
    free(sus);
    return VRT_OK;
}

/* The reply type must be string */
int reply_string_binary_compare(const void *r1,const void *r2)
{
    redisReply *reply1 = *(redisReply **)r1, *reply2 = *(redisReply **)r2;
    int minlen;
    int cmp;

    minlen = (reply1->len < reply2->len) ? reply1->len:reply2->len;
    cmp = memcmp(reply1->str,reply2->str,minlen);
    if (cmp == 0) return reply1->len - reply2->len;
    return cmp;
}

/* Turn a comma separated list of command type names, such as
 * 'string,list,set,zset,hash,server,key,expire', into a bit mask of
 * TEST_CMD_TYPE_* flags. Names are matched without regard to case.
 *
 * Returns the mask, or -1 when the list cannot be split, is empty, or
 * contains a name that is not known. */
int parse_command_types(char *command_types_str)
{
    static const struct {
        const char *name;
        int flag;
    } known_types[] = {
        { "string", TEST_CMD_TYPE_STRING },
        { "list",   TEST_CMD_TYPE_LIST },
        { "set",    TEST_CMD_TYPE_SET },
        { "zset",   TEST_CMD_TYPE_ZSET },
        { "hash",   TEST_CMD_TYPE_HASH },
        { "server", TEST_CMD_TYPE_SERVER },
        { "key",    TEST_CMD_TYPE_KEY },
        { "expire", TEST_CMD_TYPE_EXPIRE }
    };
    const size_t nknown = sizeof(known_types)/sizeof(known_types[0]);
    sds *tokens;
    int ntokens, t;
    int mask = 0;

    tokens = sdssplitlen(command_types_str,strlen(command_types_str),",",1,&ntokens);
    if (tokens == NULL) {
        return -1;
    }
    if (ntokens <= 0) {
        sdsfreesplitres(tokens,ntokens);
        return -1;
    }

    for (t = 0; t < ntokens; t ++) {
        size_t k;

        for (k = 0; k < nknown; k ++) {
            if (strcasecmp(tokens[t],known_types[k].name) == 0) break;
        }

        /* No table entry matched: the whole list is rejected. */
        if (k == nknown) {
            mask = -1;
            break;
        }

        mask |= known_types[k].flag;
    }

    sdsfreesplitres(tokens,ntokens);

    return mask;
}

/* Split a comma separated command list, such as 'get,set,lrange,zrange',
 * into a darray of sds strings.
 *
 * Ownership of every name moves into the returned array. Returns NULL when
 * the input is NULL, cannot be split, is empty, or the array cannot be
 * created. */
darray *parse_command_list(char *command_list_str)
{
    darray *commands;
    sds *command_elem;
    sds *command_strs;
    int command_count, j;

    if (command_list_str == NULL) {
        return NULL;
    }

    command_strs = sdssplitlen(command_list_str,strlen(command_list_str),",",1,&command_count);
    if (command_strs == NULL) {
        /* Failures are reported as NULL: an integer such as -1 is not a
         * valid pointer value for the caller to test. */
        return NULL;
    } else if (command_count <= 0) {
        sdsfreesplitres(command_strs,command_count);
        return NULL;
    }

    commands = darray_create(command_count, sizeof(sds));
    if (commands == NULL) {
        sdsfreesplitres(command_strs,command_count);
        return NULL;
    }

    for (j = 0; j < command_count; j ++) {
        command_elem = darray_push(commands);
        *command_elem = command_strs[j];
        /* The string now belongs to the array; clear the slot so the
         * split result cleanup below does not free it. */
        command_strs[j] = NULL;
    }

    sdsfreesplitres(command_strs,command_count);

    return commands;
}

/* Map a REDIS_* key type constant to its lower case name; any other value
 * yields "unknow". The returned string is a literal and must not be freed. */
char *
get_key_type_string(int keytype)
{
    if (keytype == REDIS_STRING) return "string";
    if (keytype == REDIS_LIST) return "list";
    if (keytype == REDIS_SET) return "set";
    if (keytype == REDIS_ZSET) return "zset";
    if (keytype == REDIS_HASH) return "hash";

    return "unknow";
}


================================================
FILE: tests/vrt_public.h
================================================
#ifndef _VRT_PUBLIC_H_
#define _VRT_PUBLIC_H_

#ifdef HAVE_CONFIG_H
# include <config.h>
#endif

#include <dspecialconfig.h>

#include <unistd.h>

#include <hiredis.h>

/* Types that are only referred to by name in this header. */
struct darray;
struct key_cache_pool;

/* Outcome of a single test case. */
#define VRT_TEST_OK             0
#define VRT_TEST_ERR            1

/* Command categories; one bit each so they can be combined in a mask. */
#define TEST_CMD_TYPE_STRING    (1 << 0)
#define TEST_CMD_TYPE_LIST      (1 << 1)
#define TEST_CMD_TYPE_SET       (1 << 2)
#define TEST_CMD_TYPE_ZSET      (1 << 3)
#define TEST_CMD_TYPE_HASH      (1 << 4)
#define TEST_CMD_TYPE_SERVER    (1 << 5)
#define TEST_CMD_TYPE_KEY       (1 << 6)
#define TEST_CMD_TYPE_EXPIRE    (1 << 7)

/* key types */
#define REDIS_STRING            0
#define REDIS_LIST              1
#define REDIS_SET               2
#define REDIS_ZSET              3
#define REDIS_HASH              4

/* State control API
 *
 * Four macros to add to, subtract from, set and read a shared variable:
 *   update_state_add(_value, _n)  adds _n to _value
 *   update_state_sub(_value, _n)  subtracts _n from _value
 *   update_state_set(_value, _n)  stores _n into _value
 *   update_state_get(_value, _v)  stores the current _value into *_v
 *
 * Three implementations are selected at compile time: the __atomic
 * builtins, the __sync builtins, or a plain update guarded by the global
 * mutex 'state_locker'. TEST_STATE_LOCK_TYPE names the one in use. */
/* GCC version >= 4.7 */
#if defined(__ATOMIC_RELAXED)
#define update_state_add(_value, _n) __atomic_add_fetch(&_value, (_n), __ATOMIC_RELAXED)
#define update_state_sub(_value, _n) __atomic_sub_fetch(&_value, (_n), __ATOMIC_RELAXED)
#define update_state_set(_value, _n) __atomic_store_n(&_value, (_n), __ATOMIC_RELAXED)
#define update_state_get(_value, _v) do {         \
    __atomic_load(&_value, _v, __ATOMIC_RELAXED); \
} while(0)

#define TEST_STATE_LOCK_TYPE "__ATOMIC_RELAXED"
/* GCC version >= 4.1 */
#elif defined(HAVE_ATOMIC)
#define update_state_add(_value, _n) __sync_add_and_fetch(&_value, (_n))
#define update_state_sub(_value, _n) __sync_sub_and_fetch(&_value, (_n))
#define update_state_set(_value, _n) __sync_lock_test_and_set(&_value, (_n))
/* Adding 0 is used here to read the value through a __sync builtin. */
#define update_state_get(_value, _v) do {         \
    (*_v) = __sync_add_and_fetch(&_value, 0);     \
} while(0)

#define TEST_STATE_LOCK_TYPE "HAVE_ATOMIC"
#else
/* Fallback: one global mutex serializes every state access. */
extern pthread_mutex_t state_locker;

#define update_state_add(_value, _n) do {   \
    pthread_mutex_lock(&state_locker);      \
    _value += (_n);                         \
    pthread_mutex_unlock(&state_locker);    \
} while(0)

#define update_state_sub(_value, _n) do {   \
    pthread_mutex_lock(&state_locker);      \
    _value -= (_n);                         \
    pthread_mutex_unlock(&state_locker);    \
} while(0)

#define update_state_set(_value, _n) do {   \
    pthread_mutex_lock(&state_locker);      \
    _value = (_n);                          \
    pthread_mutex_unlock(&state_locker);    \
} while(0)

#define update_state_get(_value, _v) do {   \
    pthread_mutex_lock(&state_locker);      \
    (*_v) = _value;                         \
    pthread_mutex_unlock(&state_locker);    \
} while(0)

#define TEST_STATE_LOCK_TYPE "pthread_mutex_lock"
#endif

/* Bookkeeping for one vire server process started by the tests. */
typedef struct vire_instance {
    sds host;       /* Address used to connect to the server. */
    int port;       /* Port the server is configured to listen on. */
    
    sds dir;        /* Directory that holds the files of this instance. */
    sds conf_file;  /* Path of the configuration file given to the server. */
    sds pid_file;   /* Path of the pid file given to the server. */
    sds log_file;   /* Path of the log file given to the server. */

    int running;    /* 1 while the server is considered running, 0 otherwise. */
    int pid;        /* Process id of the server, or -1 when not known. */
    redisContext *ctx;  /* Connection to the server, or NULL. */
} vire_instance;

/* Set the path of the vire binary used to start servers. */
void set_execute_file(char *file);

/* Create / release the bookkeeping of one server instance. Destroying an
 * instance also stops its server when it is marked as running. */
vire_instance *vire_instance_create(int port);
void vire_instance_destroy(vire_instance *vi);

/* Start the server of an instance (returns VRT_OK or VRT_ERROR) / stop it. */
int vire_server_run(vire_instance *vi);
void vire_server_stop(vire_instance *vi);

/* Create / remove the temporary work directory used by the instances. */
int create_work_dir(void);
int destroy_work_dir(void);

/* Create an instance and start its server; returns NULL on failure. */
vire_instance *start_one_vire_instance(void);

/* Print the outcome (VRT_TEST_OK or VRT_TEST_ERR) of one test case. */
void show_test_result(int result,char *test_content,char *errmsg);

/* Fixed size pool of cached keys, written in a circular fashion and
 * protected by its own mutex. */
typedef struct key_cache_array {
    long long cached_keys_count;    /* Number of keys stored so far; never exceeds max_pool_size. */
    long long ckeys_write_idx;      /* Slot the next key is written to; wraps to 0 at max_pool_size. */
    long long max_pool_size;    /* Max keys count that can be cached in the ckeys array. */
    sds *ckeys;    /* Cached keys that may exist in the target redis/vire servers. */
    pthread_mutex_t pmutex;     /* Guards the fields above. */
} key_cache_array;

/* Key cache: create (NULL when max_pool_size is below 10), destroy, store
 * a copy of a key, and fetch a copy of a random cached key (NULL when the
 * cache is empty). */
key_cache_array *key_cache_array_create(long long max_pool_size);
void key_cache_array_destroy(key_cache_array *kca);
int key_cache_array_input(key_cache_array *kca, char *key, size_t keylen);
sds key_cache_array_random(key_cache_array *kca);

/* Value of field 'name' in the reply of an 'info' command, or -1. */
long long get_longlong_from_info_reply(redisReply *reply, char *name);

/* Move the contents of 'r' into a newly allocated reply. */
redisReply *steal_hiredis_redisreply(redisReply *r);
/* Returns 0 when both replies are the same, non-zero otherwise. */
int check_two_replys_if_same(redisReply *reply1, redisReply *reply2);
/* Sort an array of pointers in groups of 'step' elements, ordered by the
 * idx_cmp-th element of every group. */
int sort_array_by_step(void **element, size_t elements, int step, int idx_cmp, int (*fcmp)(const void *,const void *));
/* Comparator for string replies; arguments point to redisReply pointers. */
int reply_string_binary_compare(const void *r1,const void *r2);

/* Parse a comma separated list of command type names into a bit mask of
 * TEST_CMD_TYPE_* flags; -1 on error. */
int parse_command_types(char *command_types_str);
/* Parse a comma separated list of command names into a darray of sds. */
struct darray *parse_command_list(char *command_list_str);

/* Name of a REDIS_* key type constant. */
char *get_key_type_string(int keytype);

#endif


================================================
FILE: tests/vrt_simple.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <getopt.h>
#include <fcntl.h>
#include <errno.h>
#include <signal.h>
#include <sys/stat.h>
#include <sys/utsname.h>

#include <hiredis.h>

#include <vrt_util.h>
#include <vrt_public.h>
#include <vrt_simple.h>

/* Size of the failure message buffer: the log line limit minus 100.
 * The parentheses keep the expansion intact when the macro is used inside
 * a larger expression (e.g. ERRMSG_MAX_LEN*2). */
#define ERRMSG_MAX_LEN (LOG_MAX_LEN-100)
/* Failure cause reported by the test that is currently running. */
static char errmsg[ERRMSG_MAX_LEN];

/* SET a key and GET it back: SET must answer with the status "OK" and GET
 * must return exactly the stored value.
 * Prints the result and returns 1 when the test passed, 0 otherwise. */
static int simple_test_cmd_get_set(vire_instance *vi)
{
    char *MESSAGE = "GET/SET simple test";
    char *key = "test_cmd_get_set-key";
    char *value = "test_cmd_get_set-value";
    redisReply *reply;
    int passed = 0;

    reply = redisCommand(vi->ctx, "set %s %s", key, value);
    if (reply == NULL || reply->type != REDIS_REPLY_STATUS || 
        reply->len != 2 || strcmp(reply->str,"OK")) {
        goto done;
    }
    freeReplyObject(reply);

    reply = redisCommand(vi->ctx, "get %s", key);
    if (reply == NULL || reply->type != REDIS_REPLY_STRING || 
        reply->len != strlen(value) || strcmp(reply->str,value)) {
        goto done;
    }

    passed = 1;

done:

    /* 'reply' is the last reply received (or NULL) on every path. */
    if (reply) freeReplyObject(reply);

    if (passed) {
        show_test_result(VRT_TEST_OK,MESSAGE,errmsg);
        return 1;
    }

    show_test_result(VRT_TEST_ERR,MESSAGE,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/* SETNX on a deleted key must return 1 and store the value; a second SETNX
 * on the same key must return 0.
 * Prints the result and returns 1 when the test passed, 0 otherwise. */
static int simple_test_cmd_setnx(vire_instance *vi)
{
    char *MESSAGE = "SETNX simple test";
    char *key = "test_cmd_setnx-key";
    char *value = "test_cmd_setnx-value";
    redisReply *reply;
    int passed = 0;

    /* Start from a key that does not exist. */
    reply = redisCommand(vi->ctx, "del %s", key);
    if (reply == NULL || reply->type == REDIS_REPLY_ERROR) {
        goto done;
    }
    freeReplyObject(reply);

    reply = redisCommand(vi->ctx, "setnx %s %s", key, value);
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
        reply->integer != 1) {
        goto done;
    }
    freeReplyObject(reply);

    reply = redisCommand(vi->ctx, "get %s", key);
    if (reply == NULL || reply->type != REDIS_REPLY_STRING || 
        reply->len != strlen(value) || strcmp(reply->str,value)) {
        goto done;
    }
    freeReplyObject(reply);

    /* The key exists now, so this one must not set anything. */
    reply = redisCommand(vi->ctx, "setnx %s %s", key, value);
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
        reply->integer != 0) {
        goto done;
    }

    passed = 1;

done:

    if (reply) freeReplyObject(reply);

    if (passed) {
        show_test_result(VRT_TEST_OK,MESSAGE,errmsg);
        return 1;
    }

    show_test_result(VRT_TEST_ERR,MESSAGE,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/* SETEX a key with a 100 second expire: the value must be readable and TTL
 * must report between 98 and 100 seconds.
 * Prints the result and returns 1 when the test passed, 0 otherwise. */
static int simple_test_cmd_setex(vire_instance *vi)
{
    char *MESSAGE = "SETEX simple test";
    char *key = "test_cmd_setex-key";
    char *value = "test_cmd_setex-value";
    long long seconds = 100;
    redisReply *reply;
    int passed = 0;

    reply = redisCommand(vi->ctx, "setex %s %lld %s", key, seconds, value);
    if (reply == NULL || reply->type != REDIS_REPLY_STATUS || 
        reply->len != 2 || strcmp(reply->str,"OK")) {
        goto done;
    }
    freeReplyObject(reply);

    reply = redisCommand(vi->ctx, "get %s", key);
    if (reply == NULL || reply->type != REDIS_REPLY_STRING || 
        reply->len != strlen(value) || strcmp(reply->str,value)) {
        goto done;
    }
    freeReplyObject(reply);

    /* Allow the remaining time to be up to 2 seconds below the expire. */
    reply = redisCommand(vi->ctx, "ttl %s", key);
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
        reply->integer > seconds ||  reply->integer < seconds - 2) {
        goto done;
    }

    passed = 1;

done:

    if (reply) freeReplyObject(reply);

    if (passed) {
        show_test_result(VRT_TEST_OK,MESSAGE,errmsg);
        return 1;
    }

    show_test_result(VRT_TEST_ERR,MESSAGE,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/* PSETEX a key with a 100000 millisecond expire: the value must be
 * readable and PTTL must report between 98000 and 100000 milliseconds.
 * Prints the result and returns 1 when the test passed, 0 otherwise. */
static int simple_test_cmd_psetex(vire_instance *vi)
{
    char *MESSAGE = "PSETEX simple test";
    char *key = "test_cmd_psetex-key";
    char *value = "test_cmd_psetex-value";
    long long milliseconds = 100000;
    redisReply *reply;
    int passed = 0;

    reply = redisCommand(vi->ctx, "psetex %s %lld %s", key, milliseconds, value);
    if (reply == NULL || reply->type != REDIS_REPLY_STATUS || 
        reply->len != 2 || strcmp(reply->str,"OK")) {
        goto done;
    }
    freeReplyObject(reply);

    reply = redisCommand(vi->ctx, "get %s", key);
    if (reply == NULL || reply->type != REDIS_REPLY_STRING || 
        reply->len != strlen(value) || strcmp(reply->str,value)) {
        goto done;
    }
    freeReplyObject(reply);

    /* Allow the remaining time to be up to 2000 ms below the expire. */
    reply = redisCommand(vi->ctx, "pttl %s", key);
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
        reply->integer > milliseconds ||  reply->integer < milliseconds - 2000) {
        goto done;
    }

    passed = 1;

done:

    if (reply) freeReplyObject(reply);

    if (passed) {
        show_test_result(VRT_TEST_OK,MESSAGE,errmsg);
        return 1;
    }

    show_test_result(VRT_TEST_ERR,MESSAGE,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/*
 * INCR simple test.
 *
 * Deletes the key, increments it 100 times while checking every
 * intermediate reply, verifies the stored value through GET, and finally
 * checks that INCR on a non-numeric value yields an error reply.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_incr(vire_instance *vi)
{
    char *title = "INCR simple test";
    char *key = "test_cmd_incr-key";
    long long rounds = 100;
    long long i;
    long long stored;
    redisReply *reply = NULL;

    /* Start from a missing key so the first INCR returns 1. */
    reply = redisCommand(vi->ctx, "del %s", key);
    if (!reply || reply->type == REDIS_REPLY_ERROR) {
        goto failed;
    }
    freeReplyObject(reply);

    /* The i-th increment must return exactly i. */
    for (i = 1; i <= rounds; i++) {
        reply = redisCommand(vi->ctx, "incr %s", key);
        if (!reply || reply->type != REDIS_REPLY_INTEGER ||
            reply->integer != i) {
            vrt_scnprintf(errmsg, LOG_MAX_LEN, "incr %lld times error", i);
            goto failed;
        }
        freeReplyObject(reply);
    }

    /* GET returns the counter as a string; parse and compare it. */
    reply = redisCommand(vi->ctx, "get %s", key);
    if (!reply || reply->type != REDIS_REPLY_STRING) {
        goto failed;
    }
    if (!string2ll(reply->str,reply->len,&stored) || stored != rounds) {
        vrt_scnprintf(errmsg, LOG_MAX_LEN, "incr to %lld error, %s in fact", 
            rounds, reply->str);
        goto failed;
    }
    freeReplyObject(reply);

    /* Replace the counter with a non-numeric value... */
    reply = redisCommand(vi->ctx, "set %s %s", key, "a");
    if (!reply || reply->type != REDIS_REPLY_STATUS) {
        goto failed;
    }
    if (reply->len != 2 || strcmp(reply->str,"OK")) {
        goto failed;
    }
    freeReplyObject(reply);

    /* ...and expect INCR to be rejected with an error reply. */
    reply = redisCommand(vi->ctx, "incr %s", key);
    if (!reply || reply->type != REDIS_REPLY_ERROR) {
        goto failed;
    }
    freeReplyObject(reply);

    show_test_result(VRT_TEST_OK,title,errmsg);

    return 1;

failed:

    if (reply) freeReplyObject(reply);

    show_test_result(VRT_TEST_ERR,title,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/*
 * DECR simple test.
 *
 * Deletes the key, decrements it 100 times while checking every
 * intermediate reply, verifies the stored value through GET, and finally
 * checks that DECR on a non-numeric value yields an error reply.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_decr(vire_instance *vi)
{
    char *key = "test_cmd_decr-key";
    long long n = 0, decr_times = 100;
    char *MESSAGE = "DECR simple test";
    redisReply * reply = NULL;

    /* Start from a missing key so the first DECR returns -1. */
    reply = redisCommand(vi->ctx, "del %s", key);
    if (reply == NULL || reply->type == REDIS_REPLY_ERROR) {
        goto error;
    }
    freeReplyObject(reply);

    /* After n+1 decrements the reply must be -(n+1). */
    while (n < decr_times) {
        reply = redisCommand(vi->ctx, "decr %s", key);
        if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
            reply->integer + n != -1) {
            /* Name the command under test (this used to say "incr"). */
            vrt_scnprintf(errmsg, LOG_MAX_LEN, "decr %lld times error", n+1);
            goto error;
        }
        freeReplyObject(reply);
        
        n ++;
    }

    /* GET returns the counter as a string; it must parse to -decr_times. */
    reply = redisCommand(vi->ctx, "get %s", key);
    if (reply == NULL || reply->type != REDIS_REPLY_STRING) {
        goto error;
    } else {
        long long value;
        if (!string2ll(reply->str,reply->len,&value) || value + decr_times != 0) {
            vrt_scnprintf(errmsg, LOG_MAX_LEN, "decr to -%lld error, %s in fact", 
                decr_times, reply->str);
            goto error;
        }
    }
    freeReplyObject(reply);

    /* Replace the counter with a non-numeric value... */
    reply = redisCommand(vi->ctx, "set %s %s", key, "a");
    if (reply == NULL || reply->type != REDIS_REPLY_STATUS || 
        reply->len != 2 || strcmp(reply->str,"OK")) {
        goto error;
    }
    freeReplyObject(reply);

    /* ...and expect DECR (not INCR) to be rejected with an error reply,
     * so that the command under test is the one whose error path runs. */
    reply = redisCommand(vi->ctx, "decr %s", key);
    if (reply == NULL || reply->type != REDIS_REPLY_ERROR) {
        goto error;
    }
    freeReplyObject(reply);

    show_test_result(VRT_TEST_OK,MESSAGE,errmsg);

    return 1;

error:

    if (reply) freeReplyObject(reply);

    show_test_result(VRT_TEST_ERR,MESSAGE,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/*
 * INCRBY simple test.
 *
 * Deletes the key, applies INCRBY with a step of 3 a hundred times while
 * checking every intermediate reply, verifies the stored value through
 * GET, and finally checks that INCRBY on a non-numeric value yields an
 * error reply.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_incrby(vire_instance *vi)
{
    char *title = "INCRBY simple test";
    char *key = "test_cmd_incrby-key";
    long long rounds = 100;
    long long step = 3;
    long long i;
    long long stored;
    redisReply *reply = NULL;

    /* Start from a missing key. */
    reply = redisCommand(vi->ctx, "del %s", key);
    if (!reply || reply->type == REDIS_REPLY_ERROR) {
        goto failed;
    }
    freeReplyObject(reply);

    /* The i-th call must return i * step. */
    for (i = 1; i <= rounds; i++) {
        reply = redisCommand(vi->ctx, "incrby %s %lld", key, step);
        if (!reply || reply->type != REDIS_REPLY_INTEGER ||
            reply->integer != i*step) {
            vrt_scnprintf(errmsg, LOG_MAX_LEN, "incrby %lld %lld times error", 
                step, i);
            goto failed;
        }
        freeReplyObject(reply);
    }

    /* GET returns the counter as a string; parse and compare it. */
    reply = redisCommand(vi->ctx, "get %s", key);
    if (!reply || reply->type != REDIS_REPLY_STRING) {
        goto failed;
    }
    if (!string2ll(reply->str,reply->len,&stored) ||
        stored != rounds*step) {
        vrt_scnprintf(errmsg, LOG_MAX_LEN, "incrby to %lld error, %s in fact", 
            rounds*step, reply->str);
        goto failed;
    }
    freeReplyObject(reply);

    /* Replace the counter with a non-numeric value... */
    reply = redisCommand(vi->ctx, "set %s %s", key, "a");
    if (!reply || reply->type != REDIS_REPLY_STATUS) {
        goto failed;
    }
    if (reply->len != 2 || strcmp(reply->str,"OK")) {
        goto failed;
    }
    freeReplyObject(reply);

    /* ...and expect INCRBY to be rejected with an error reply. */
    reply = redisCommand(vi->ctx, "incrby %s %lld", key, step);
    if (!reply || reply->type != REDIS_REPLY_ERROR) {
        goto failed;
    }
    freeReplyObject(reply);

    show_test_result(VRT_TEST_OK,title,errmsg);

    return 1;

failed:

    if (reply) freeReplyObject(reply);

    show_test_result(VRT_TEST_ERR,title,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/*
 * DECRBY simple test.
 *
 * Deletes the key, applies DECRBY with a step of 3 a hundred times while
 * checking every intermediate reply, verifies the stored value through
 * GET, and finally checks that DECRBY on a non-numeric value yields an
 * error reply.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_decrby(vire_instance *vi)
{
    char *title = "DECRBY simple test";
    char *key = "test_cmd_decrby-key";
    long long rounds = 100;
    long long step = 3;
    long long i;
    long long stored;
    redisReply *reply = NULL;

    /* Start from a missing key. */
    reply = redisCommand(vi->ctx, "del %s", key);
    if (!reply || reply->type == REDIS_REPLY_ERROR) {
        goto failed;
    }
    freeReplyObject(reply);

    /* The i-th call must return -(i * step). */
    for (i = 1; i <= rounds; i++) {
        reply = redisCommand(vi->ctx, "decrby %s %lld", key, step);
        if (!reply || reply->type != REDIS_REPLY_INTEGER ||
            reply->integer + i*step != 0) {
            vrt_scnprintf(errmsg, LOG_MAX_LEN, "decrby %lld %lld times error", 
                step, i);
            goto failed;
        }
        freeReplyObject(reply);
    }

    /* GET returns the counter as a string; it must parse to -(rounds*step). */
    reply = redisCommand(vi->ctx, "get %s", key);
    if (!reply || reply->type != REDIS_REPLY_STRING) {
        goto failed;
    }
    if (!string2ll(reply->str,reply->len,&stored) ||
        stored + rounds*step != 0) {
        vrt_scnprintf(errmsg, LOG_MAX_LEN, "decrby to -%lld error, %s in fact", 
            rounds*step, reply->str);
        goto failed;
    }
    freeReplyObject(reply);

    /* Replace the counter with a non-numeric value... */
    reply = redisCommand(vi->ctx, "set %s %s", key, "a");
    if (!reply || reply->type != REDIS_REPLY_STATUS) {
        goto failed;
    }
    if (reply->len != 2 || strcmp(reply->str,"OK")) {
        goto failed;
    }
    freeReplyObject(reply);

    /* ...and expect DECRBY to be rejected with an error reply. */
    reply = redisCommand(vi->ctx, "decrby %s %lld", key, step);
    if (!reply || reply->type != REDIS_REPLY_ERROR) {
        goto failed;
    }
    freeReplyObject(reply);

    show_test_result(VRT_TEST_OK,title,errmsg);

    return 1;

failed:

    if (reply) freeReplyObject(reply);

    show_test_result(VRT_TEST_ERR,title,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/*
 * APPEND simple test.
 *
 * Deletes the key, then rebuilds a fixed string on the server by
 * appending it in pieces of at most three characters. Every APPEND reply
 * must equal the number of characters sent so far, and a final GET must
 * return the complete string.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_append(vire_instance *vi)
{
    char *title = "APPEND simple test";
    char *key = "test_cmd_append-key";
    char *final_value = "pqwpioqjqwoiuqiorueljsakhdflkqueuquewqwei[oqfiqpq-0ewrq0hdalkjz.zhjaidhfioahd";
    int total = (int)strlen(final_value);
    int chunk_max = 3;
    int sent = 0;
    char piece[20];
    redisReply *reply = NULL;

    /* Start from a missing key so lengths count from zero. */
    reply = redisCommand(vi->ctx, "del %s", key);
    if (!reply || reply->type == REDIS_REPLY_ERROR) {
        goto failed;
    }
    freeReplyObject(reply);

    while (sent < total) {
        /* Take the next piece; the last one may be shorter. */
        int chunk = total - sent;
        if (chunk > chunk_max) {
            chunk = chunk_max;
        }
        memcpy(piece,final_value+sent,chunk);
        piece[chunk] = '\0';

        reply = redisCommand(vi->ctx, "append %s %s", key, piece);
        if (!reply || reply->type != REDIS_REPLY_INTEGER) {
            goto failed;
        }
        /* APPEND replies with the string length after the operation. */
        if (reply->integer != sent+chunk) {
            vrt_scnprintf(errmsg, LOG_MAX_LEN, "append %s %s error", 
                key, piece);
            goto failed;
        }
        freeReplyObject(reply);

        sent += chunk;
    }

    /* The assembled value must match the source string exactly. */
    reply = redisCommand(vi->ctx, "get %s", key);
    if (!reply || reply->type != REDIS_REPLY_STRING) {
        goto failed;
    }
    if (reply->len != strlen(final_value) || strcmp(reply->str,final_value)) {
        goto failed;
    }
    freeReplyObject(reply);

    show_test_result(VRT_TEST_OK,title,errmsg);

    return 1;

failed:

    if (reply) freeReplyObject(reply);

    show_test_result(VRT_TEST_ERR,title,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/*
 * STRLEN simple test.
 *
 * Stores a known value with SET and checks that STRLEN reports its
 * length.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_strlen(vire_instance *vi)
{
    char *title = "STRLEN simple test";
    char *k = "test_cmd_strlen-key";
    char *v = "test_cmd_strlen-value";
    redisReply *r = NULL;
    int passed = 0;

    /* SET must answer with the status "OK". */
    r = redisCommand(vi->ctx, "set %s %s", k, v);
    if (!r || r->type != REDIS_REPLY_STATUS) {
        goto done;
    }
    if (r->len != 2 || strcmp(r->str,"OK")) {
        goto done;
    }
    freeReplyObject(r);
    r = NULL;

    /* STRLEN must report the length of the stored value. */
    r = redisCommand(vi->ctx, "strlen %s", k);
    if (!r || r->type != REDIS_REPLY_INTEGER) {
        goto done;
    }
    if (r->integer != strlen(v)) {
        goto done;
    }
    freeReplyObject(r);
    r = NULL;

    passed = 1;

done:

    /* Only a failing step leaves a live reply behind. */
    if (r) freeReplyObject(r);

    if (passed) {
        show_test_result(VRT_TEST_OK,title,errmsg);
        return 1;
    }

    show_test_result(VRT_TEST_ERR,title,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/*
 * GETSET simple test.
 *
 * Stores an initial value, swaps it with GETSET (which must hand back the
 * initial value), and confirms through GET that the replacement is what
 * is now stored.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_getset(vire_instance *vi)
{
    char *title = "GETSET simple test";
    char *k = "test_cmd_getset-key";
    char *before = "test_cmd_getset-oldvalue";
    char *after = "test_cmd_getset-newvalue";
    redisReply *r = NULL;

    /* Seed the key with the initial value. */
    r = redisCommand(vi->ctx, "set %s %s", k, before);
    if (!r || r->type != REDIS_REPLY_STATUS) {
        goto failed;
    }
    if (r->len != 2 || strcmp(r->str,"OK")) {
        goto failed;
    }
    freeReplyObject(r);

    /* GETSET returns the previous value while storing the new one. */
    r = redisCommand(vi->ctx, "getset %s %s", k, after);
    if (!r || r->type != REDIS_REPLY_STRING) {
        goto failed;
    }
    if (r->len != strlen(before) || strcmp(r->str,before)) {
        goto failed;
    }
    freeReplyObject(r);

    /* The key must now hold the replacement value. */
    r = redisCommand(vi->ctx, "get %s", k);
    if (!r || r->type != REDIS_REPLY_STRING) {
        goto failed;
    }
    if (r->len != strlen(after) || strcmp(r->str,after)) {
        goto failed;
    }
    freeReplyObject(r);

    show_test_result(VRT_TEST_OK,title,errmsg);

    return 1;

failed:

    if (r) freeReplyObject(r);

    show_test_result(VRT_TEST_ERR,title,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/*
 * INCRBYFLOAT simple test.
 *
 * Deletes the key, applies INCRBYFLOAT a hundred times with a step of
 * 3.14 (only the reply type is checked per step), compares the stored
 * value against a fixed expected string, and finally checks that
 * INCRBYFLOAT on a non-numeric value yields an error reply.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_incrbyfloat(vire_instance *vi)
{
    char *title = "INCRBYFLOAT simple test";
    char *key = "test_cmd_incrbyfloat-key";
    char *expected = "314.00000000000000022";
    long long rounds = 100;
    long long i;
    float step = 3.14;
    redisReply *reply = NULL;

    /* Start from a missing key. */
    reply = redisCommand(vi->ctx, "del %s", key);
    if (!reply || reply->type == REDIS_REPLY_ERROR) {
        goto failed;
    }
    freeReplyObject(reply);

    /* Each increment must answer with a string reply. */
    for (i = 1; i <= rounds; i++) {
        reply = redisCommand(vi->ctx, "incrbyfloat %s %f", key, step);
        if (!reply || reply->type != REDIS_REPLY_STRING) {
            vrt_scnprintf(errmsg, LOG_MAX_LEN, "incrbyfloat %f %lld times error", 
                step, i);
            goto failed;
        }
        freeReplyObject(reply);
    }

    /* The accumulated value is compared textually with the expectation. */
    reply = redisCommand(vi->ctx, "get %s", key);
    if (!reply || reply->type != REDIS_REPLY_STRING ||
        strcmp(reply->str,expected)) {
        vrt_scnprintf(errmsg, LOG_MAX_LEN, "incrbyfloat to %s error", expected);
        goto failed;
    }
    freeReplyObject(reply);

    /* Replace the counter with a non-numeric value... */
    reply = redisCommand(vi->ctx, "set %s %s", key, "a");
    if (!reply || reply->type != REDIS_REPLY_STATUS) {
        goto failed;
    }
    if (reply->len != 2 || strcmp(reply->str,"OK")) {
        goto failed;
    }
    freeReplyObject(reply);

    /* ...and expect INCRBYFLOAT to be rejected with an error reply. */
    reply = redisCommand(vi->ctx, "incrbyfloat %s %f", key, step);
    if (!reply || reply->type != REDIS_REPLY_ERROR) {
        goto failed;
    }
    freeReplyObject(reply);

    show_test_result(VRT_TEST_OK,title,errmsg);

    return 1;

failed:

    if (reply) freeReplyObject(reply);

    show_test_result(VRT_TEST_ERR,title,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/*
 * GETBIT/SETBIT/BITCOUNT simple test.
 *
 * Deletes the key, sets `times` distinct bits (offsets begin, begin+step,
 * ...), reads each of them back with GETBIT, and checks that BITCOUNT
 * reports exactly `times` set bits.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_getbit_setbit_bitcount(vire_instance *vi)
{
    char *key = "test_cmd_getbit_setbit_bitcount-key";
    char *MESSAGE = "GETBIT/SETBIT/BITCOUNT simple test";
    int begin = 11, step = 3, times = 79, n;
    redisReply * reply = NULL;

    /* Remove any leftover key first, as the sibling tests do: SETBIT
     * below must see every bit as previously clear, and BITCOUNT must
     * count only the bits set by this test. */
    reply = redisCommand(vi->ctx, "del %s", key);
    if (reply == NULL || reply->type == REDIS_REPLY_ERROR) {
        goto error;
    }
    freeReplyObject(reply);

    /* SETBIT replies with the previous bit value, which must be 0. */
    for (n = 0; n < times; n ++) {
        reply = redisCommand(vi->ctx, "setbit %s %d 1", key, begin+n*step);
        if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
            reply->integer != 0) {
            goto error;
        }
        freeReplyObject(reply);
    }

    /* Every bit that was set must now read back as 1. */
    for (n = 0; n < times; n ++) {
        reply = redisCommand(vi->ctx, "getbit %s %d", key, begin+n*step);
        if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
            reply->integer != 1) {
            goto error;
        }
        freeReplyObject(reply);
    }

    /* No other bits were set, so the population count equals `times`. */
    reply = redisCommand(vi->ctx, "bitcount %s", key);
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
        reply->integer != times) {
        goto error;
    }
    freeReplyObject(reply);

    show_test_result(VRT_TEST_OK,MESSAGE,errmsg);

    return 1;

error:

    if (reply) freeReplyObject(reply);

    show_test_result(VRT_TEST_ERR,MESSAGE,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/*
 * GETRANGE/SETRANGE simple test.
 *
 * Deletes the key, writes the same short string at `times` increasing
 * offsets with SETRANGE (each reply must equal the resulting string
 * length), then reads every written window back with GETRANGE.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_getrange_setrange(vire_instance *vi)
{
    char *key = "test_cmd_getrange_setrange-key";
    char *MESSAGE = "GETRANGE/SETRANGE simple test";
    char *range_value = "o090pl[]m,187h";
    int begin = 11, step = 53, times = 79, n;
    /* Kept as int so that every offset handed to a "%d" conversion really
     * is an int; mixing in strlen()'s size_t would mismatch the format. */
    int value_len = (int)strlen(range_value);
    redisReply * reply = NULL;

    /* Remove any leftover key: the SETRANGE length checks below assume
     * the string grows from empty. */
    reply = redisCommand(vi->ctx, "del %s", key);
    if (reply == NULL || reply->type == REDIS_REPLY_ERROR) {
        goto error;
    }
    freeReplyObject(reply);

    for (n = 0; n < times; n ++) {
        int offset = begin+n*step;

        /* Offsets increase, so each write extends the string and the
         * reply is the end position of the piece just written. */
        reply = redisCommand(vi->ctx, "setrange %s %d %s", 
            key, offset, range_value);
        if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
            reply->integer != offset+value_len) {
            vrt_scnprintf(errmsg, LOG_MAX_LEN, "setrange %s %d %s error", 
                key, offset, range_value);
            goto error;
        }
        freeReplyObject(reply);
    }

    for (n = 0; n < times; n ++) {
        int first = begin+n*step;
        int last = first+value_len-1;   /* GETRANGE end is inclusive */

        reply = redisCommand(vi->ctx, "getrange %s %d %d", key, 
            first, last);
        if (reply == NULL || reply->type != REDIS_REPLY_STRING || 
            reply->len != value_len || strcmp(reply->str, range_value)) {
            vrt_scnprintf(errmsg, LOG_MAX_LEN, "getrange %s %d %d error", 
                key, first, last);
            goto error;
        }
        freeReplyObject(reply);
    }

    show_test_result(VRT_TEST_OK,MESSAGE,errmsg);

    return 1;

error:

    if (reply) freeReplyObject(reply);

    show_test_result(VRT_TEST_ERR,MESSAGE,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/*
 * BITPOS simple test.
 *
 * Checks "BITPOS key 1" in three situations: on a missing key (-1), on a
 * key that only had a bit cleared (-1), and after setting bit 11 (11).
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_bitpos(vire_instance *vi)
{
    char *title = "BITPOS simple test";
    char *key = "test_cmd_bitpos-key";
    int target_bit = 11;
    redisReply *r = NULL;

    /* Start from a missing key. */
    r = redisCommand(vi->ctx, "del %s", key);
    if (!r || r->type == REDIS_REPLY_ERROR) {
        goto failed;
    }
    freeReplyObject(r);

    /* Missing key: no set bit can be found. */
    r = redisCommand(vi->ctx, "bitpos %s 1", key);
    if (!r || r->type != REDIS_REPLY_INTEGER || r->integer != -1) {
        vrt_scnprintf(errmsg, LOG_MAX_LEN, "bitpos %s 1 first time error", 
            key);
        goto failed;
    }
    freeReplyObject(r);

    /* Clearing a bit creates the key without setting any bit. */
    r = redisCommand(vi->ctx, "setbit %s 1 0", key);
    if (!r || r->type != REDIS_REPLY_INTEGER || r->integer != 0) {
        vrt_scnprintf(errmsg, LOG_MAX_LEN, "setbit %s 1 0 error", 
            key);
        goto failed;
    }
    freeReplyObject(r);

    /* Key exists but still holds no set bit. */
    r = redisCommand(vi->ctx, "bitpos %s 1", key);
    if (!r || r->type != REDIS_REPLY_INTEGER || r->integer != -1) {
        vrt_scnprintf(errmsg, LOG_MAX_LEN, "bitpos %s 1 second time error", 
            key);
        goto failed;
    }
    freeReplyObject(r);

    /* Set exactly one bit; its previous value must have been 0. */
    r = redisCommand(vi->ctx, "setbit %s %d 1", key, target_bit);
    if (!r || r->type != REDIS_REPLY_INTEGER || r->integer != 0) {
        vrt_scnprintf(errmsg, LOG_MAX_LEN, "setbit %s %d 1 error", 
            key, target_bit);
        goto failed;
    }
    freeReplyObject(r);

    /* The first set bit is now the one just written. */
    r = redisCommand(vi->ctx, "bitpos %s 1", key);
    if (!r || r->type != REDIS_REPLY_INTEGER || r->integer != target_bit) {
        vrt_scnprintf(errmsg, LOG_MAX_LEN, "bitpos %s 1 third time error", 
            key);
        goto failed;
    }
    freeReplyObject(r);

    show_test_result(VRT_TEST_OK,title,errmsg);

    return 1;

failed:

    if (r) freeReplyObject(r);

    show_test_result(VRT_TEST_ERR,title,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/* Number of key/value pairs written by MSET and read back by MGET. */
#define MGET_MSET_KEYS_COUNT 333
/*
 * MGET/MSET simple test.
 *
 * Builds MGET_MSET_KEYS_COUNT numbered key/value pairs, writes them with
 * one MSET, reads them back with one MGET, and checks that every element
 * of the reply matches the value written for the corresponding key.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_mget_mset(vire_instance *vi)
{
    char *title = "MGET/MSET simple test";
    char *key_prefix = "test_cmd_mget_mset-key";
    char *value_prefix = "test_cmd_mget_mset-value";
    char keys[MGET_MSET_KEYS_COUNT][30];
    char values[MGET_MSET_KEYS_COUNT][30];
    char *argv[1+2*MGET_MSET_KEYS_COUNT];
    size_t argvlen[1+2*MGET_MSET_KEYS_COUNT];
    int i;
    redisReply *reply = NULL;

    /* "mset k0 v0 k1 v1 ...": pair i lives in slots 1+2i and 2+2i. */
    argv[0] = "mset";
    argvlen[0] = strlen(argv[0]);
    for (i = 0; i < MGET_MSET_KEYS_COUNT; i++) {
        vrt_scnprintf(keys[i], 30,"%s%d", key_prefix, i);
        vrt_scnprintf(values[i], 30,"%s%d", value_prefix, i);

        argv[1+2*i] = keys[i];
        argvlen[1+2*i] = strlen(keys[i]);
        argv[2+2*i] = values[i];
        argvlen[2+2*i] = strlen(values[i]);
    }

    reply = redisCommandArgv(vi->ctx, 1+2*MGET_MSET_KEYS_COUNT, argv, argvlen);
    if (!reply || reply->type != REDIS_REPLY_STATUS ||
        reply->len != 2 || strcmp(reply->str,"OK")) {
        vrt_scnprintf(errmsg, LOG_MAX_LEN, "mset %d keys error", 
            MGET_MSET_KEYS_COUNT);
        goto failed;
    }
    freeReplyObject(reply);

    /* "mget k0 k1 ...": reuse the argument arrays, keys only. */
    argv[0] = "mget";
    argvlen[0] = strlen(argv[0]);
    for (i = 0; i < MGET_MSET_KEYS_COUNT; i++) {
        argv[i+1] = keys[i];
        argvlen[i+1] = strlen(argv[i+1]);
    }

    reply = redisCommandArgv(vi->ctx, 1+MGET_MSET_KEYS_COUNT, argv, argvlen);
    if (!reply || reply->type != REDIS_REPLY_ARRAY ||
        reply->elements != MGET_MSET_KEYS_COUNT) {
        vrt_scnprintf(errmsg, LOG_MAX_LEN, "mget %d keys error", 
            MGET_MSET_KEYS_COUNT);
        goto failed;
    }

    /* Element i of the reply must be the value stored for key i. */
    for (i = 0; i < MGET_MSET_KEYS_COUNT; i++) {
        redisReply *item = reply->element[i];
        if (item == NULL || item->type != REDIS_REPLY_STRING) {
            goto failed;
        }
        if (item->len != strlen(values[i]) || strcmp(item->str, values[i])) {
            goto failed;
        }
    }
    freeReplyObject(reply);
    reply = NULL;

    show_test_result(VRT_TEST_OK,title,errmsg);

    return 1;

failed:

    if (reply) freeReplyObject(reply);

    show_test_result(VRT_TEST_ERR,title,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/* Encoding simple_test_hash_init() expects "object encoding" to report
 * for the hash it builds: "ziplist" for ZIPLIST, "hashtable" for HT. */
#define TEST_HASH_ENCODED_ZIPLIST    0
#define TEST_HASH_ENCODED_HT         1
/* For a TEST_HASH_ENCODED_HT hash, which dimension is made large:
 * the field count (BY_FILED), the value length (BY_VALUE), or both
 * (BY_ALL). Ignored when the requested encoding is ZIPLIST. */
#define TEST_HASH_ENCODED_CAUSED_BY_FILED    0
#define TEST_HASH_ENCODED_CAUSED_BY_VALUE    1
#define TEST_HASH_ENCODED_CAUSED_BY_ALL      2
/* Small and large field counts used when building the hash. */
#define TEST_HASH_ENCODED_ZIPLIST_FIELD_COUNT    56
#define TEST_HASH_ENCODED_HT_FIELD_COUNT         678
/* Small and large value lengths (in characters) used when building the
 * hash. */
#define TEST_HASH_ENCODED_ZIPLIST_VALUE_LEN      21
#define TEST_HASH_ENCODED_HT_VALUE_LEN           111

/* One field/value pair of a test hash. Both strings are heap-allocated
 * by simple_test_hash_init() and released by
 * test_hash_members_destroy(). */
struct test_hash_member {
    char *field;    /* NUL-terminated hash field name */
    char *value;    /* NUL-terminated value stored under the field */
};

/*
 * Count the entries of a NULL-terminated array of hash members.
 *
 * thms: array of member pointers whose last slot is NULL.
 *
 * Returns the number of entries before the terminating NULL.
 */
static int test_hash_member_length(struct test_hash_member **thms)
{
    int count;

    for (count = 0; thms[count] != NULL; count++) {
        /* nothing to do: the loop header does the counting */
    }

    return count;
}

/*
 * Release a NULL-terminated array of hash members.
 *
 * Frees the field string, the value string and the member itself for
 * every entry before the terminating NULL, then frees the array.
 */
static void test_hash_members_destroy(struct test_hash_member **thms)
{
    struct test_hash_member **cursor;

    for (cursor = thms; *cursor != NULL; cursor++) {
        struct test_hash_member *member = *cursor;

        free(member->field);
        free(member->value);
        free(member);
    }

    free(thms);
}

/*
 * Build a hash under `key` on the server and return a local copy of its
 * members.
 *
 * vi:           instance whose connection (vi->ctx) is used.
 * key:          hash key; any existing key of that name is deleted first.
 * hash_encode:  TEST_HASH_ENCODED_ZIPLIST or TEST_HASH_ENCODED_HT, the
 *               encoding "object encoding" is expected to report.
 * encode_cause: for TEST_HASH_ENCODED_HT, one of the
 *               TEST_HASH_ENCODED_CAUSED_BY_* constants selecting whether
 *               the field count, the value length, or both are large.
 *               Ignored for TEST_HASH_ENCODED_ZIPLIST.
 *
 * Each value is the text "test_hash-value<j>" padded on the right with
 * 'x' up to exactly value_len characters, so the values stay distinct and
 * have a well-defined length.
 *
 * Returns a NULL-terminated array that the caller must release with
 * test_hash_members_destroy(), or NULL when a command fails, a reply does
 * not match, an allocation fails, or encode_cause is not recognised.
 */
static struct test_hash_member **simple_test_hash_init(vire_instance *vi, char *key, int hash_encode, int encode_cause)
{
    char *field = "test_hash-field";
    char *value = "test_hash-value";
    int field_count, value_len;
    int j,n;
    struct test_hash_member **thms = NULL;
    redisReply *reply = NULL;

    reply = redisCommand(vi->ctx, "del %s", key);
    if (reply == NULL || reply->type == REDIS_REPLY_ERROR) {
        goto error;
    }
    freeReplyObject(reply);
    /* The error path frees `reply`; keep it NULL while no reply is live
     * so the non-command failures below cannot free it twice. */
    reply = NULL;

    if (hash_encode == TEST_HASH_ENCODED_ZIPLIST) {
        field_count = TEST_HASH_ENCODED_ZIPLIST_FIELD_COUNT;
        value_len = TEST_HASH_ENCODED_ZIPLIST_VALUE_LEN;
    } else if (encode_cause == TEST_HASH_ENCODED_CAUSED_BY_FILED) {
        field_count = TEST_HASH_ENCODED_HT_FIELD_COUNT;
        value_len = TEST_HASH_ENCODED_ZIPLIST_VALUE_LEN;
    } else if (encode_cause == TEST_HASH_ENCODED_CAUSED_BY_VALUE) {
        field_count = TEST_HASH_ENCODED_ZIPLIST_FIELD_COUNT;
        value_len = TEST_HASH_ENCODED_HT_VALUE_LEN;
    } else if (encode_cause == TEST_HASH_ENCODED_CAUSED_BY_ALL) {
        field_count = TEST_HASH_ENCODED_HT_FIELD_COUNT;
        value_len = TEST_HASH_ENCODED_HT_VALUE_LEN;
    } else {
        /* Unknown cause: refuse rather than size the hash from
         * uninitialized variables. */
        goto error;
    }

    /* calloc keeps the array NULL-terminated at every moment, so a
     * partially built array can be handed to test_hash_members_destroy()
     * if an allocation fails midway. */
    thms = calloc((size_t)field_count+1, sizeof(*thms));
    if (thms == NULL) {
        goto error;
    }
    for (j = 0; j < field_count; j ++) {
        thms[j] = calloc(1, sizeof(*thms[j]));
        if (thms[j] == NULL) {
            goto error;
        }
        thms[j]->field = malloc(30*sizeof(char));
        thms[j]->value = malloc((value_len+1)*sizeof(char));
        if (thms[j]->field == NULL || thms[j]->value == NULL) {
            goto error;
        }

        vrt_scnprintf(thms[j]->field, 30, "%s%d", field, j);
        n = vrt_scnprintf(thms[j]->value, value_len, "%s%d", value, j);
        /* Guard against an unexpected return value before using it as
         * an offset into the buffer. */
        if (n < 0) n = 0;
        if (n > value_len) n = value_len;
        /* Pad AFTER the formatted text. Padding from offset 0 would
         * overwrite the text and leave the tail uninitialized. */
        memset(thms[j]->value+n,'x',value_len-n);
        thms[j]->value[value_len] = '\0';
    }

    for (j = 0; j < field_count; j ++) { 
        /* Every field is new, so HSET must reply 1. */
        reply = redisCommand(vi->ctx, "hset %s %s %s", 
            key, thms[j]->field, thms[j]->value);
        if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
            reply->integer != 1) {
            goto error;
        }
        freeReplyObject(reply);
        reply = NULL;
    }

    reply = redisCommand(vi->ctx, "hlen %s", key);
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
        reply->integer != field_count) {
        goto error;
    }
    freeReplyObject(reply);
    reply = NULL;

    /* The server must have picked the encoding the caller asked for. */
    reply = redisCommand(vi->ctx, "object encoding %s", key);
    if (reply == NULL || reply->type != REDIS_REPLY_STRING) {
        goto error;
    } else {
        if (hash_encode == TEST_HASH_ENCODED_ZIPLIST) {
            if(reply->len != 7 || strcmp(reply->str, "ziplist")) {
                goto error;
            }
        } else {
            if(reply->len != 9 || strcmp(reply->str, "hashtable")) {
                goto error;
            }
        }
    }
    freeReplyObject(reply);
    
    return thms;

error:

    if (thms) {
        test_hash_members_destroy(thms);
        thms = NULL;
    }

    if (reply) freeReplyObject(reply);

    return NULL;
}

/*
 * HASH ENCODE simple test.
 *
 * Builds the same hash key five times through simple_test_hash_init(),
 * once per encoding/cause combination listed below, and fails as soon as
 * one of the builds returns NULL.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_hash_encode(vire_instance *vi)
{
    /* { expected encoding, cause } pairs, tried in this order. */
    static const int scenarios[][2] = {
        { TEST_HASH_ENCODED_ZIPLIST, TEST_HASH_ENCODED_CAUSED_BY_FILED },
        { TEST_HASH_ENCODED_ZIPLIST, TEST_HASH_ENCODED_CAUSED_BY_VALUE },
        { TEST_HASH_ENCODED_HT,      TEST_HASH_ENCODED_CAUSED_BY_FILED },
        { TEST_HASH_ENCODED_HT,      TEST_HASH_ENCODED_CAUSED_BY_VALUE },
        { TEST_HASH_ENCODED_HT,      TEST_HASH_ENCODED_CAUSED_BY_ALL   },
    };
    char *title = "HASH ENCODE simple test";
    char *key = "test_hash_encode";
    struct test_hash_member **members;
    size_t i;

    for (i = 0; i < sizeof(scenarios)/sizeof(scenarios[0]); i++) {
        members = simple_test_hash_init(vi,key,scenarios[i][0],scenarios[i][1]);
        if (members == NULL) {
            show_test_result(VRT_TEST_ERR,title,errmsg);
            errmsg[0] = '\0';

            return 0;
        }
        /* Only the build itself is under test; drop the local copy. */
        test_hash_members_destroy(members);
    }

    show_test_result(VRT_TEST_OK,title,errmsg);

    return 1;
}

/*
 * HGET/HSET simple test.
 *
 * First exercises HSET/HGET on a fresh single-field hash, then rebuilds
 * the key as a large hash through simple_test_hash_init() and repeats the
 * HSET/HGET round trip, additionally reading back one of the generated
 * members.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_hget_hset(vire_instance *vi)
{
    char *key = "test_cmd_hget_hset-key";
    char *field = "test_cmd_hget_hset-field";
    char *value = "test_cmd_hget_hset-value";
    char *MESSAGE = "HGET/HSET simple test";
    redisReply * reply = NULL;
    struct test_hash_member **thms = NULL;
    int idx;

    reply = redisCommand(vi->ctx, "del %s", key);
    if (reply == NULL || reply->type == REDIS_REPLY_ERROR) {
        goto error;
    }
    freeReplyObject(reply);
    
    /* New field on a missing key: HSET must reply 1. */
    reply = redisCommand(vi->ctx, "hset %s %s %s", key, field, value);
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
        reply->integer != 1) {
        goto error;
    }
    freeReplyObject(reply);

    reply = redisCommand(vi->ctx, "hget %s %s", key, field);
    if (reply == NULL || reply->type != REDIS_REPLY_STRING || 
        reply->len != strlen(value) || strcmp(reply->str,value)) {
        goto error;
    }
    freeReplyObject(reply);
    /* `reply` has been freed; clear it so that a failure of
     * simple_test_hash_init() below does not make the error path free
     * the same object a second time. */
    reply = NULL;

    /* Rebuild the key as a large hash and repeat the round trip. */
    thms = simple_test_hash_init(vi,key,TEST_HASH_ENCODED_HT,TEST_HASH_ENCODED_CAUSED_BY_FILED);
    if (thms == NULL) {
        goto error;
    }
    reply = redisCommand(vi->ctx, "hset %s %s %s", key, field, value);
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
        reply->integer != 1) {
        goto error;
    }
    freeReplyObject(reply);
    reply = redisCommand(vi->ctx, "hget %s %s", key, field);
    if (reply == NULL || reply->type != REDIS_REPLY_STRING || 
        reply->len != strlen(value) || strcmp(reply->str,value)) {
        goto error;
    }
    freeReplyObject(reply);

    /* Also read back a generated member from the middle of the set. */
    idx = test_hash_member_length(thms)/2;
    reply = redisCommand(vi->ctx, "hget %s %s", key, thms[idx]->field);
    if (reply == NULL || reply->type != REDIS_REPLY_STRING || 
        reply->len != strlen(thms[idx]->value) || strcmp(reply->str,thms[idx]->value)) {
        goto error;
    }
    freeReplyObject(reply);
    test_hash_members_destroy(thms);

    show_test_result(VRT_TEST_OK,MESSAGE,errmsg);

    return 1;

error:

    if (reply) freeReplyObject(reply);
    if (thms) test_hash_members_destroy(thms);

    show_test_result(VRT_TEST_ERR,MESSAGE,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/*
 * HLEN simple test.
 *
 * For a small (51) and a large (5111) number of fields: deletes the key,
 * adds that many distinct fields with HSET, and checks that HLEN reports
 * the same number.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_hlen(vire_instance *vi)
{
    static const int sizes[] = { 51, 5111 };
    char *title = "HLEN simple test";
    char *key = "test_cmd_hlen-key";
    char *field = "test_cmd_hlen-field";
    char *value = "test_cmd_hlen-value";
    redisReply *reply = NULL;
    size_t round;
    int i;

    for (round = 0; round < sizeof(sizes)/sizeof(sizes[0]); round++) {
        int wanted = sizes[round];

        /* Every round starts from a missing key. */
        reply = redisCommand(vi->ctx, "del %s", key);
        if (!reply || reply->type == REDIS_REPLY_ERROR) {
            goto failed;
        }
        freeReplyObject(reply);

        /* Field names carry the index, so each HSET adds a new field. */
        for (i = 0; i < wanted; i++) {
            reply = redisCommand(vi->ctx, "hset %s %s%d %s", key, field, i, value);
            if (!reply || reply->type != REDIS_REPLY_INTEGER ||
                reply->integer != 1) {
                goto failed;
            }
            freeReplyObject(reply);
        }

        reply = redisCommand(vi->ctx, "hlen %s", key);
        if (!reply || reply->type != REDIS_REPLY_INTEGER ||
            reply->integer != wanted) {
            goto failed;
        }
        freeReplyObject(reply);
    }

    show_test_result(VRT_TEST_OK,title,errmsg);

    return 1;

failed:

    if (reply) freeReplyObject(reply);

    show_test_result(VRT_TEST_ERR,title,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/*
 * HDEL simple test.
 *
 * On a two-field hash: deletes the first field and checks it is gone,
 * deletes the second field and checks that the key itself no longer
 * exists. Then rebuilds the key as a large hash through
 * simple_test_hash_init() and checks that deleting one generated member
 * makes HGET return nil for it.
 *
 * Returns 1 on success and 0 on failure; the outcome is reported through
 * show_test_result() and errmsg is cleared after a failure report.
 */
static int simple_test_cmd_hdel(vire_instance *vi)
{
    char *key = "test_cmd_hdel-key";
    char *field = "test_cmd_hdel-field";
    char *value = "test_cmd_hdel-value";
    char *MESSAGE = "HDEL simple test";
    redisReply * reply = NULL;
    struct test_hash_member **thms = NULL;
    int idx;

    reply = redisCommand(vi->ctx, "del %s", key);
    if (reply == NULL || reply->type == REDIS_REPLY_ERROR) {
        goto error;
    }
    freeReplyObject(reply);
    
    /* Create two fields, "<field>1" and "<field>2". */
    reply = redisCommand(vi->ctx, "hset %s %s%d %s", key, field, 1, value);
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
        reply->integer != 1) {
        goto error;
    }
    freeReplyObject(reply);
    reply = redisCommand(vi->ctx, "hset %s %s%d %s", key, field, 2, value);
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
        reply->integer != 1) {
        goto error;
    }
    freeReplyObject(reply);

    /* The first field is readable, then deleted, then reads as nil. */
    reply = redisCommand(vi->ctx, "hget %s %s%d", key, field, 1);
    if (reply == NULL || reply->type != REDIS_REPLY_STRING || 
        reply->len != strlen(value) || strcmp(reply->str, value)) {
        goto error;
    }
    freeReplyObject(reply);
    reply = redisCommand(vi->ctx, "hdel %s %s%d", key, field, 1);
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
        reply->integer != 1) {
        goto error;
    }
    freeReplyObject(reply);
    reply = redisCommand(vi->ctx, "hget %s %s%d", key, field, 1);
    if (reply == NULL || reply->type != REDIS_REPLY_NIL) {
        goto error;
    }
    freeReplyObject(reply);
    
    /* Deleting the last remaining field must remove the key itself. */
    reply = redisCommand(vi->ctx, "hdel %s %s%d", key, field, 2);
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
        reply->integer != 1) {
        goto error;
    }
    freeReplyObject(reply);
    reply = redisCommand(vi->ctx, "exists %s", key);
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
        reply->integer != 0) {
        goto error;
    }
    freeReplyObject(reply);
    /* `reply` has been freed; clear it so that a failure of
     * simple_test_hash_init() below does not make the error path free
     * the same object a second time. */
    reply = NULL;
    
    /* Repeat the delete-then-read check on a large hash. */
    thms = simple_test_hash_init(vi,key,TEST_HASH_ENCODED_HT,TEST_HASH_ENCODED_CAUSED_BY_FILED);
    if (thms == NULL) {
        goto error;
    }
    idx = test_hash_member_length(thms)/2;
    reply = redisCommand(vi->ctx, "hdel %s %s", key, thms[idx]->field);
    if (reply == NULL || reply->type != REDIS_REPLY_INTEGER || 
        reply->integer != 1) {
        goto error;
    }
    freeReplyObject(reply);    
    reply = redisCommand(vi->ctx, "hget %s %s", key, thms[idx]->field);
    if (reply == NULL || reply->type != REDIS_REPLY_NIL) {
        goto error;
    }
    freeReplyObject(reply);
    test_hash_members_destroy(thms);

    show_test_result(VRT_TEST_OK,MESSAGE,errmsg);

    return 1;

error:

    if (reply) freeReplyObject(reply);
    if (thms) test_hash_members_destroy(thms);

    show_test_result(VRT_TEST_ERR,MESSAGE,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/* PFADD/PFCOUNT simple test.
 *
 * Adds `count` distinct elements ("<value>0" .. "<value><count-1>") to one
 * HyperLogLog key, then adds the very same elements a second time. After
 * every PFADD the PFCOUNT result is compared with the expected cardinality:
 * the number of elements added so far during the first pass, and `count`
 * once the first pass is complete. A relative deviation of up to 2% is
 * tolerated.
 *
 * Returns 1 when the test passed, 0 otherwise. */
static int simple_test_cmd_pfadd_pfcount(vire_instance *vi)
{
    char *key = "test_cmd_pfadd_pfcount-key";
    char *value = "test_cmd_pfadd_pfcount-value";
    char *MESSAGE = "PFADD/PFCOUNT simple test";
    redisReply * reply = NULL;
    /* 'repeat' counts the completed passes; it must start at 0, otherwise
     * the loop condition below reads an indeterminate value. */
    int n = 0, count = 20329, repeat = 0;

    while (repeat < 2) {
        int expect_count;

        reply = redisCommand(vi->ctx, "pfadd %s %s%d", key, value, n++);
        if (reply == NULL || reply->type != REDIS_REPLY_INTEGER) {
            goto error;
        }
        freeReplyObject(reply);

        /* A pass is over once every element was sent: start the next one. */
        if (n >= count) {
            repeat++;
            n = 0;
        }

        /* During the first pass 'n' elements were added so far; afterwards
         * only duplicates are added, so the cardinality stays at 'count'. */
        if (repeat == 0) {
            expect_count = n;
        } else {
            expect_count = count;
        }

        reply = redisCommand(vi->ctx, "pfcount %s", key);
        if (reply == NULL || reply->type != REDIS_REPLY_INTEGER) {
            goto error;
        }
        if (reply->integer != (long long)expect_count) {
            float mistake = ((float)expect_count-(float)reply->integer)/(float)expect_count;
            if (mistake < -0.02 || mistake > 0.02) {
                vrt_scnprintf(errmsg, LOG_MAX_LEN, "pfadd %d different elements is not approximated pfcount returned %lld, mistake %f",
                    expect_count, reply->integer, mistake);
                goto error;
            }
        }
        freeReplyObject(reply);
    }

    show_test_result(VRT_TEST_OK,MESSAGE,errmsg);

    return 1;

error:

    if (reply) freeReplyObject(reply);

    show_test_result(VRT_TEST_ERR,MESSAGE,errmsg);
    errmsg[0] = '\0';

    return 0;
}

/* Run every simple command test against one freshly started vire instance.
 *
 * Returns 1 when all test cases passed, 0 when at least one failed or when
 * the vire instance could not be started. */
int simple_test(void)
{
    vire_instance *vi;
    int ok_count = 0, all_count = 0;

    vi = start_one_vire_instance();
    if (vi == NULL) {
        test_log_error("Run vire instance failed");
        /* The function returns int: report the failure explicitly instead
         * of leaving the return value indeterminate. */
        return 0;
    }

    errmsg[0] = '\0';

    /* String */
    ok_count+=simple_test_cmd_get_set(vi); all_count++;
    ok_count+=simple_test_cmd_setnx(vi); all_count++;
    ok_count+=simple_test_cmd_setex(vi); all_count++;
    ok_count+=simple_test_cmd_psetex(vi); all_count++;
    ok_count+=simple_test_cmd_incr(vi); all_count++;
    ok_count+=simple_test_cmd_decr(vi); all_count++;
    ok_count+=simple_test_cmd_incrby(vi); all_count++;
    ok_count+=simple_test_cmd_decrby(vi); all_count++;
    ok_count+=simple_test_cmd_append(vi); all_count++;
    ok_count+=simple_test_cmd_strlen(vi); all_count++;
    ok_count+=simple_test_cmd_getset(vi); all_count++;
    ok_count+=simple_test_cmd_incrbyfloat(vi); all_count++;
    ok_count+=simple_test_cmd_getbit_setbit_bitcount(vi); all_count++;
    ok_count+=simple_test_cmd_getrange_setrange(vi); all_count++;
    ok_count+=simple_test_cmd_bitpos(vi); all_count++;
    ok_count+=simple_test_cmd_mget_mset(vi); all_count++;
    /* Hash */
    ok_count+=simple_test_hash_encode(vi); all_count++;
    ok_count+=simple_test_cmd_hget_hset(vi); all_count++;
    ok_count+=simple_test_cmd_hlen(vi); all_count++;
    ok_count+=simple_test_cmd_hdel(vi); all_count++;
    /* HyperLogLog */
    ok_count+=simple_test_cmd_pfadd_pfcount(vi); all_count++;

    vire_instance_destroy(vi);

    return ok_count==all_count?1:0;
}


================================================
FILE: tests/vrt_simple.h
================================================
#ifndef _VRT_SIMPLE_H_
#define _VRT_SIMPLE_H_

/* Start one vire instance, run each simple command test against it and
 * return 1 only when all of them passed (0 when any of them failed). */
int simple_test(void);


#endif


================================================
FILE: tests/vrt_util.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <stdint.h>
#include <errno.h>
#include <fcntl.h>
#include <unistd.h>
#include <dirent.h>
#include <string.h>
#include <ctype.h>
#include <limits.h>
#include <float.h>
#include <math.h>
#include <sys/stat.h>
#include <sys/types.h>

#include <hiredis.h>

#include <vrt_util.h>

/*
 * Report a failed assertion through test_log_error() and, when 'panic' is
 * non-zero, terminate the process with abort().
 *
 * cond - text of the condition that failed
 * file - source file of the assertion
 * line - source line of the assertion
 */
void
vrt_assert(const char *cond, const char *file, int line, int panic)
{
    test_log_error("assert '%s' failed @ (%s, %d)", cond, file, line);

    if (!panic) {
        return;
    }

    abort();
}

/*
 * Bounded vsnprintf() that reports the number of characters actually
 * stored in 'buf', not counting the trailing '\0'.
 *
 * Unlike vsnprintf(), which returns the length the output would have had,
 * the result never exceeds size - 1. It is 0 when 'size' is 0 and 0 when
 * vsnprintf() fails, which allows the idiom
 *
 *     len += vrt_vscnprintf(buf + len, size - len, ...);
 *
 * See: http://lwn.net/Articles/69419/
 */
int
vrt_vscnprintf(char *buf, size_t size, const char *fmt, va_list args)
{
    int n;

    /* Nothing can be stored in an empty buffer. Without this guard the
     * truncation case below would evaluate (int)(size - 1), i.e. -1. */
    if (size == 0) {
        return 0;
    }

    n = vsnprintf(buf, size, fmt, args);
    if (n <= 0) {
        return 0;
    }

    /* n is positive here, so the conversion to size_t is lossless. */
    if ((size_t) n < size) {
        return n;
    }

    /* Output was truncated: size - 1 characters plus the '\0' were stored. */
    return (int)(size - 1);
}

/*
 * Variadic front end of vrt_vscnprintf(); same return value contract.
 */
int
vrt_scnprintf(char *buf, size_t size, const char *fmt, ...)
{
    va_list args;
    int n;

    va_start(args, fmt);
    n = vrt_vscnprintf(buf, size, fmt, args);
    va_end(args);

    return n;
}

/*
 * Format "<file>:<line> <message>\n" and write it to standard error.
 *
 * The whole record is built in a LOG_MAX_LEN byte buffer; a message that
 * does not fit is truncated. errno is saved on entry and restored on exit
 * so that logging does not disturb the caller's error state.
 */
void
_test_log_error(const char *file, int line, const char *fmt, ...)
{
    int len, size, errno_save;
    char buf[LOG_MAX_LEN];
    va_list args;

    errno_save = errno;
    len = 0;            /* length of output buffer */
    size = LOG_MAX_LEN; /* size of output buffer */

    len += vrt_scnprintf(buf + len, size - len, "%s:%d ", file, line);

    /* Use the bounded variant: plain vsnprintf() returns the length the
     * output would have had, which for a long message moves 'len' past the
     * end of 'buf' and makes the stores below overflow it. */
    va_start(args, fmt);
    len += vrt_vscnprintf(buf + len, size - len, fmt, args);
    va_end(args);

    /* len <= size - 1 here, so the newline replaces at most the '\0'. */
    buf[len++] = '\n';

    if (write(STDERR_FILENO, buf, len) < 0) {
        /* Logging is best effort; there is nowhere to report this. */
    }

    errno = errno_save;
}

/*
 * Format "<message>\n" and write it to standard output.
 *
 * The record is built in a LOG_MAX_LEN byte buffer; a message that does
 * not fit is truncated. errno is saved on entry and restored on exit.
 */
void
_test_log_out(const char *fmt, ...)
{
    int len, size, errno_save;
    char buf[LOG_MAX_LEN];
    va_list args;

    errno_save = errno;
    len = 0;            /* length of output buffer */
    size = LOG_MAX_LEN; /* size of output buffer */

    /* Use the bounded variant: plain vsnprintf() returns the length the
     * output would have had, which for a long message moves 'len' past the
     * end of 'buf' and makes the stores below overflow it. */
    va_start(args, fmt);
    len += vrt_vscnprintf(buf + len, size - len, fmt, args);
    va_end(args);

    /* len <= size - 1 here, so the newline replaces at most the '\0'. */
    buf[len++] = '\n';

    if (write(STDOUT_FILENO, buf, len) < 0) {
        /* Logging is best effort; there is nowhere to report this. */
    }

    errno = errno_save;
}

/*
 * Microseconds elapsed since the Epoch as reported by gettimeofday(),
 * or -1 when gettimeofday() fails.
 */
int64_t
vrt_usec_now(void)
{
    struct timeval tv;

    if (gettimeofday(&tv, NULL) < 0) {
        return -1;
    }

    return (int64_t)tv.tv_sec * 1000000LL + (int64_t)tv.tv_usec;
}

/*
 * Milliseconds elapsed since the Epoch, derived from vrt_usec_now().
 * Note that the -1 failure value of vrt_usec_now() truncates to 0 here.
 */
int64_t
vrt_msec_now(void)
{
    int64_t usec = vrt_usec_now();

    return usec / 1000LL;
}

/*
 * Seconds elapsed since the Epoch, derived from vrt_usec_now().
 * Note that the -1 failure value of vrt_usec_now() truncates to 0 here.
 */
int64_t
vrt_sec_now(void)
{
    int64_t usec = vrt_usec_now();

    return usec / 1000000LL;
}

/* Turn 'filename' into an absolute path, returned as a new SDS string.
 * NULL is returned when the current working directory cannot be obtained.
 *
 * The name is first stripped with sdstrim() using the set " \r\n\t". If the
 * result already starts with '/', it is returned as is. Otherwise it is
 * appended to the current working directory.
 *
 * No general normalization is attempted: only "../" elements found at the
 * very start of a relative 'filename' are resolved, each one dropping the
 * last component of the working directory. */
sds getAbsolutePath(char *filename) {
    char workdir[1024];
    sds result;
    sds rel = sdsnew(filename);

    sdstrim(rel," \r\n\t");
    if (rel[0] == '/') {
        /* Nothing to do, the path is absolute already. */
        return rel;
    }

    if (getcwd(workdir,sizeof(workdir)) == NULL) {
        sdsfree(rel);
        return NULL;
    }

    /* Make sure the directory part ends with exactly one separator. */
    result = sdsnew(workdir);
    if (sdslen(result) != 0 && result[sdslen(result)-1] != '/') {
        result = sdscat(result,"/");
    }

    /* Consume every leading "../" of the relative part. For each of them
     * the last directory element is dropped as well, unless the directory
     * part has already been reduced to "/". */
    while (sdslen(rel) >= 3 && strncmp(rel,"../",3) == 0) {
        char *cursor;
        int trimlen;

        sdsrange(rel,3,-1);
        if (sdslen(result) <= 1) {
            continue;
        }

        /* Start just before the trailing '/' and walk back to the previous
         * one, counting how many bytes have to go. */
        trimlen = 1;
        for (cursor = result + sdslen(result) - 2; *cursor != '/'; cursor--) {
            trimlen++;
        }
        sdsrange(result,0,-(trimlen+1));
    }

    /* Join directory and remaining relative part. */
    result = sdscatsds(result,rel);
    sdsfree(rel);
    return result;
}

/* Number of decimal digits needed to print the unsigned value 'v'.
 *
 * Small values are answered by a few comparisons. Values of 10^12 and above
 * are reduced by dividing by 10^12 and counting the remaining digits
 * recursively. */
uint32_t digits10(uint64_t v) {
    /* One to three digits: the most common inputs come first. */
    if (v < 10) return 1;
    if (v < 100) return 2;
    if (v < 1000) return 3;

    /* Thirteen digits or more: strip twelve digits and recurse. */
    if (v >= 1000000000000ULL) {
        return 12 + digits10(v / 1000000000000ULL);
    }

    /* Four to twelve digits, tested from the largest range down. */
    if (v >= 10000000000ULL) {
        return (v >= 100000000000ULL) ? 12 : 11;
    }
    if (v >= 100000000ULL) {
        return (v >= 1000000000ULL) ? 10 : 9;
    }
    if (v >= 1000000) {
        return (v >= 10000000ULL) ? 8 : 7;
    }
    if (v >= 10000) {
        return (v >= 100000) ? 6 : 5;
    }
    return 4;
}

/* Signed counterpart of digits10(): number of characters needed to print
 * 'v' in radix 10, counting the leading '-' of negative values. */
uint32_t sdigits10(int64_t v) {
    uint64_t magnitude;

    if (v >= 0) {
        return digits10(v);
    }

    /* LLONG_MIN has no positive counterpart, so its absolute value is
     * computed in unsigned arithmetic instead of by negation. */
    if (v == LLONG_MIN) {
        magnitude = ((uint64_t) LLONG_MAX)+1;
    } else {
        magnitude = (uint64_t)-v;
    }

    return digits10(magnitude)+1; /* +1 for the minus. */
}

/* Write the decimal representation of 'svalue' into 'dst' as a
 * NUL-terminated string.
 *
 * Returns the number of characters written, not counting the terminator,
 * or 0 when 'dstlen' is too small to hold the string and its terminator.
 *
 * Digits are produced two at a time from the least significant end using a
 * lookup table of the pairs "00".."99". The technique is described in:
 *
 * https://www.facebook.com/notes/facebook-engineering/three-optimization-tips-for-c/10151361643253920
 *
 * The version here additionally handles negative numbers. */
int ll2string(char* dst, size_t dstlen, long long svalue) {
    static const char pairs[201] =
        "0001020304050607080910111213141516171819"
        "2021222324252627282930313233343536373839"
        "4041424344454647484950515253545556575859"
        "6061626364656667686970717273747576777879"
        "8081828384858687888990919293949596979899";
    int negative = (svalue < 0);
    unsigned long long magnitude;
    uint32_t length, pos;

    /* Work on the absolute value as an unsigned number. LLONG_MIN cannot
     * be negated as a signed value, hence the dedicated case. */
    if (!negative) {
        magnitude = svalue;
    } else if (svalue == LLONG_MIN) {
        magnitude = ((unsigned long long) LLONG_MAX)+1;
    } else {
        magnitude = -svalue;
    }

    /* The string needs 'length' characters plus the terminator. */
    length = digits10(magnitude)+negative;
    if (length >= dstlen) return 0;

    /* Terminate first, then fill in from the right, two digits per step. */
    dst[length] = '\0';
    pos = length - 1;
    for (; magnitude >= 100; magnitude /= 100, pos -= 2) {
        int const i = (magnitude % 100) * 2;

        dst[pos] = pairs[i + 1];
        dst[pos - 1] = pairs[i];
    }

    /* One or two leading digits remain. */
    if (magnitude >= 10) {
        int const i = (uint32_t) magnitude * 2;

        dst[pos] = pairs[i + 1];
        dst[pos - 1] = pairs[i];
    } else {
        dst[pos] = '0' + (uint32_t) magnitude;
    }

    if (negative) dst[0] = '-';
    return length;
}

/* Parse the 'slen' bytes at 's' as a decimal long long.
 *
 * Accepted input is exactly "0", or an optional '-' followed by a digit
 * 1-9 and any number of further digits. There must be no leading zeros, no
 * '+' sign, no spaces and no trailing bytes.
 *
 * Returns 1 when the text is valid and the number fits into a long long,
 * 0 otherwise. On success the number is stored in '*value' unless 'value'
 * is NULL; on failure '*value' is left untouched. */
int string2ll(const char *s, size_t slen, long long *value) {
    /* Largest magnitude a negative result may have: |LLONG_MIN|. */
    const unsigned long long min_magnitude = ((unsigned long long) LLONG_MAX)+1;
    const char *p = s;
    size_t plen = 0;
    int negative = 0;
    unsigned long long v;

    if (slen == 0)
        return 0;

    /* Special case: first and only digit is 0. */
    if (slen == 1 && p[0] == '0') {
        if (value != NULL) *value = 0;
        return 1;
    }

    if (p[0] == '-') {
        negative = 1;
        p++; plen++;

        /* Abort on only a negative sign. */
        if (plen == slen)
            return 0;
    }

    /* The first digit must be 1-9. The lone "0" was handled above, so a
     * '0' here is either a leading zero or "-0", both of them invalid. */
    if (p[0] < '1' || p[0] > '9')
        return 0;
    v = p[0]-'0';
    p++; plen++;

    while (plen < slen && p[0] >= '0' && p[0] <= '9') {
        unsigned int digit = p[0]-'0';

        if (v > (ULLONG_MAX / 10)) /* Overflow. */
            return 0;
        v *= 10;

        if (v > (ULLONG_MAX - digit)) /* Overflow. */
            return 0;
        v += digit;

        p++; plen++;
    }

    /* Return if not all bytes were used. */
    if (plen < slen)
        return 0;

    if (negative) {
        if (v > min_magnitude) /* Overflow. */
            return 0;
        if (value != NULL) {
            /* |LLONG_MIN| is not representable as a positive long long, so
             * it is mapped explicitly rather than negated. */
            *value = (v == min_magnitude) ? LLONG_MIN : -(long long)v;
        }
    } else {
        if (v > LLONG_MAX) /* Overflow. */
            return 0;
        if (value != NULL) *value = v;
    }
    return 1;
}

/* Parse the 'slen' bytes at 's' as a decimal long using string2ll().
 *
 * Returns 1 and stores the number in '*lval' when the text is valid and
 * the number fits into a long. Returns 0 otherwise, leaving '*lval'
 * untouched. */
int string2l(const char *s, size_t slen, long *lval) {
    long long parsed;

    if (string2ll(s,slen,&parsed) == 0 ||
        parsed < LONG_MIN || parsed > LONG_MAX)
    {
        return 0;
    }

    *lval = (long)parsed;
    return 1;
}

/* Format 'value' into 'buf', which is 'len' bytes large, so that the text
 * can be parsed back with strtod(3).
 *
 * NaN is written as "nan", infinities as "inf" / "-inf" and zeros as "0" /
 * "-0". Every other value is printed with "%.17g". When <float.h> and
 * <limits.h> confirm a mantissa of at least 52 bits and a 64 bit long long,
 * integral values are printed by the faster ll2string().
 *
 * Returns what the formatting function used returned. For the snprintf()
 * paths that is the length the text needs, which may exceed 'len' - 1 when
 * the output was truncated. For the ll2string() path it is the length
 * written, or 0 when the buffer is too small. */
int d2string(char *buf, size_t len, double value) {
    int written; /* kept apart from 'len': the results are ints */

    if (isnan(value)) {
        written = snprintf(buf,len,"nan");
    } else if (isinf(value)) {
        written = snprintf(buf,len,"%s",(value < 0) ? "-inf" : "inf");
    } else if (value == 0) {
        /* Negative zero compares equal to zero; dividing by it tells the
         * two apart because the quotient is -inf.
         * See: http://en.wikipedia.org/wiki/Signed_zero, "Comparisons". */
        written = snprintf(buf,len,"%s",(1.0/value < 0) ? "-0" : "0");
    } else {
#if (DBL_MANT_DIG >= 52) && (LLONG_MAX == 0x7fffffffffffffffLL)
        /* Check if the float is in a safe range to be casted into a
         * long long. We are assuming that long long is 64 bit here.
         * Also we are assuming that there are no implementations around where
         * double has precision < 52 bit.
         *
         * Under this assumptions we test if a double is inside an interval
         * where casting to long long is safe. Then using two castings we
         * make sure the decimal part is zero. If all this is true we use
         * integer printing function that is much faster. */
        double min = -4503599627370495; /* -((2^52)-1) */
        double max = 4503599627370496; /* 2^52 */
        if (value > min && value < max && value == ((double)((long long)value)))
            written = ll2string(buf,len,(long long)value);
        else
#endif
            written = snprintf(buf,len,"%.17g",value);
    }

    return written;
}

/* Create the directory 'path' with mode 0755.
 * Returns VRT_OK on success and VRT_ERROR when mkdir() fails. */
int create_dir(char *path)
{
    int status = mkdir(path,0755);

    return (status < 0) ? VRT_ERROR : VRT_OK;
}

/* Remove the directory 'path' together with everything below it.
 *
 * Entries are addressed as "<path>/<name>", so the working directory of the
 * process is never changed. Changing into 'path' instead is unsafe: if the
 * chdir() fails, the relative removes hit the wrong directory.
 *
 * Removal of the individual entries is best effort: failures of remove()
 * are not reported. Returns VRT_ERROR when 'path' cannot be opened as a
 * directory or when memory for an entry name cannot be allocated, VRT_OK
 * otherwise. */
int destroy_dir(char *path)
{
    DIR *dp;
    struct dirent *entry;

    if ((dp = opendir(path)) == NULL) {
        test_log_error("Can't open dir: %s", path);
        return VRT_ERROR;
    }

    while ((entry = readdir(dp)) != NULL) {
        struct stat statbuf;
        size_t child_size;
        char *child;

        if (strcmp(".", entry->d_name) == 0 || strcmp("..", entry->d_name) == 0)
            continue;

        /* path + '/' + name + '\0' */
        child_size = strlen(path) + 1 + strlen(entry->d_name) + 1;
        child = malloc(child_size);
        if (child == NULL) {
            closedir(dp);
            return VRT_ERROR;
        }
        snprintf(child, child_size, "%s/%s", path, entry->d_name);

        /* lstat() does not follow symbolic links, so a link to a directory
         * is removed itself instead of being descended into. S_ISDIR()
         * compares the whole file type field; testing the S_IFDIR bit alone
         * also matches other types such as sockets and block devices. */
        if (lstat(child, &statbuf) == 0 && S_ISDIR(statbuf.st_mode)) {
            destroy_dir(child);
        } else {
            remove(child);
        }

        free(child);
    }

    closedir(dp);

    remove(path);
    return VRT_OK;
}

/* Ask a vire instance for its process id with the "info server" command.
 *
 * redisctx - connection to use; when NULL a temporary connection to
 *            host:port is opened and closed again before returning
 * host     - host to connect to when 'redisctx' is NULL
 * port     - port to connect to when 'redisctx' is NULL
 *
 * The reply is split into lines and the number following the first
 * "process_id" field is taken.
 *
 * Returns the pid, or -1 when the command fails, the reply has an
 * unexpected type, the pid cannot be parsed, or no such line exists. */
int get_pid_from_reply(redisContext *redisctx, char *host, int port)
{
    redisContext *ctx = redisctx;
    redisReply *reply = NULL;
    sds *lines = NULL;
    size_t line_len;
    int count = 0, j;
    long value;
    int pid = -1;

    if (ctx == NULL) {
        ctx = redisConnect(host,port);
    }

    if (ctx == NULL) {
        test_log_error("Get pid from instance failed: can't connect to %s:%d",host,port);
        return -1;
    }

    reply = redisCommand(ctx, "info server");
    if (reply == NULL) {
        test_log_error("Execute 'info server' command on vire failed: %s\n",
            ctx->err?ctx->errstr:"");
        goto done;
    }

    if (reply->type != REDIS_REPLY_STRING) {
        test_log_error("Reply for 'info server' command from vire type %d is error",
            reply->type);
        goto done;
    }

    lines = sdssplitlen(reply->str,reply->len,"\r\n",2,&count);
    if (lines == NULL) {
        test_log_error("Reply for 'info server' command from vire is error");
        goto done;
    }

    for (j = 0; j < count; j ++) {
        line_len = sdslen(lines[j]);
        if (line_len > 11 && !strncmp("process_id", lines[j], 10)) {
            /* string2l() stores a long. Parse into a real long and narrow
             * afterwards; handing it the address of the int 'pid' would
             * write past that variable where long is wider than int. */
            if (string2l(lines[j]+11,line_len-11,&value) == 0 ||
                value < INT_MIN || value > INT_MAX) {
                /* The precision of "%.*s" has to be an int. */
                test_log_error("Convert pid string %.*s to long failed",
                    (int)(line_len-11),lines[j]+11);
            } else {
                pid = (int)value;
            }
            break;
        }
    }

done:
    /* Single exit: release whatever was acquired. The connection is closed
     * only when it was opened here. */
    if (lines != NULL) sdsfreesplitres(lines,count);
    if (reply != NULL) freeReplyObject(reply);
    if (redisctx == NULL) redisFree(ctx);

    return pid;
}

/* Parse a range given as text: either one number such as "10" or two
 * numbers joined by '-' such as "0-100".
 *
 * str   - text to parse
 * len   - number of bytes of 'str' to parse
 * count - set to the number of values returned (1 or 2), or to -1 on error
 *
 * Returns an array of '*count' values allocated with malloc(), which the
 * caller has to free(). NULL is returned when the text is not a valid
 * range, when the first value of a pair is greater than the second, or
 * when memory cannot be allocated. */
long long *get_range_from_string(char *str, size_t len, int *count)
{
    int elem_count = 0;
    int j;
    sds *elems = NULL;
    long long *range = NULL;

    if (str == NULL) {
        goto error;
    }

    /* Split the caller's text, not the global getopt 'optarg'. */
    elems = sdssplitlen(str,len,"-",1,&elem_count);
    if (elems == NULL) {
        goto error;
    }

    /* A range is made of exactly one or two numbers. */
    if (elem_count != 1 && elem_count != 2) {
        goto error;
    }

    range = malloc(elem_count*sizeof(*range));
    if (range == NULL) {
        goto error;
    }

    for (j = 0; j < elem_count; j ++) {
        if (string2ll(elems[j],sdslen(elems[j]),&range[j]) != 1) {
            goto error;
        }
    }

    if (elem_count == 2 && range[0] > range[1]) {
        goto error;
    }

    sdsfreesplitres(elems,elem_count);

    *count = elem_count;
    return range;

error:

    if (elems != NULL) sdsfreesplitres(elems,elem_count);
    free(range);

    *count = -1;
    return NULL;
}

/* Split an address of the form "host:port".
 *
 * address - NUL-terminated text to parse
 * port    - receives the port number, or 0 when parsing fails
 *
 * Returns the host part as an SDS string that the caller has to release
 * with sdsfree(). NULL is returned when 'address' is NULL, when it does not
 * consist of exactly two ':' separated parts, or when the port is not a
 * number in the range 1-65535. */
sds get_host_port_from_address_string(char *address, int *port)
{
    sds *host_port;
    int count = 0;
    sds host;
    long value;

    *port = 0;

    if (address == NULL) {
        return NULL;
    }

    host_port = sdssplitlen(address,strlen(address),":",1,&count);
    if (host_port == NULL) {
        return NULL;
    } else if (count != 2) {
        sdsfreesplitres(host_port,count);
        return NULL;
    }

    /* 65535 is the highest valid port number and has to be accepted. */
    if (string2l(host_port[1],sdslen(host_port[1]),&value) != 1 ||
        value <= 0 || value > 65535) {
        sdsfreesplitres(host_port,count);
        return NULL;
    }

    *port = (int)value;

    /* Detach the host from the array so that freeing the split result
     * below does not release the string handed to the caller. */
    host = host_port[0];
    host_port[0] = NULL;
    sdsfreesplitres(host_port,count);

    return host;
}


================================================
FILE: tests/vrt_util.h
================================================
#ifndef _VRT_UTIL_H_
#define _VRT_UTIL_H_

#ifdef HAVE_CONFIG_H
# include <config.h>
#endif

#ifdef HAVE_DEBUG_LOG
# define VRT_DEBUG_LOG 1
#endif

#include <dspecialconfig.h>

#include <sds.h>

/* Types used by the declarations below (va_list, size_t, int64_t, uint8_t),
 * included here so that the header does not depend on what the including
 * file happened to include first. */
#include <stdarg.h>
#include <stddef.h>
#include <stdint.h>

/* Only a pointer to the hiredis context is needed in this header, so a
 * forward declaration is enough and <hiredis.h> does not have to come
 * first. */
struct redisContext;

/* Status codes returned by the test utilities. */
#define VRT_OK        0
#define VRT_ERROR    -1

/* Buffer sizes for the decimal text of unsigned integers: the maximum
 * number of digits plus one byte for the terminating '\0'. */
#define VRT_UINT8_MAXLEN     (3 + 1)
#define VRT_UINT16_MAXLEN    (5 + 1)
#define VRT_UINT32_MAXLEN    (10 + 1)
#define VRT_UINT64_MAXLEN    (20 + 1)
#define VRT_UINTMAX_MAXLEN   VRT_UINT64_MAXLEN

#define VRT_MAXHOSTNAMELEN   256

/* Line terminators. The casts are wrapped in parentheses so that the
 * macros behave as single operands inside larger expressions. */
#define LF                  ((uint8_t) 10)
#define CR                  ((uint8_t) 13)
#define CRLF                "\x0d\x0a"
#define CRLF_LEN            (sizeof("\x0d\x0a") - 1)

#define LOG_MAX_LEN 256 /* max length of log message */

/* Logging back ends; use the test_log_*() macros below instead. */
void _test_log_error(const char *file, int line, const char *fmt, ...);
void _test_log_out(const char *fmt, ...);

/* test_log_debug() expands to nothing unless VRT_DEBUG_LOG is defined. */
#if defined(VRT_DEBUG_LOG)
#define test_log_debug(...) do {                              \
    _test_log_error(__FILE__, __LINE__, __VA_ARGS__);         \
} while (0)
#else
#define test_log_debug(...)
#endif
/* Log a message tagged with the calling file and line. */
#define test_log_error(...) do {                              \
    _test_log_error(__FILE__, __LINE__, __VA_ARGS__);         \
} while (0)
/* Log a plain message. */
#define test_log_out(...) do {                                \
    _test_log_out(__VA_ARGS__);                               \
} while (0)

void vrt_assert(const char *cond, const char *file, int line, int panic);

/* Log the failed condition and abort the process when '_x' is false. */
#define ASSERT(_x) do {                         \
    if (!(_x)) {                                \
        vrt_assert(#_x, __FILE__, __LINE__, 1);  \
    }                                           \
} while (0)

/* Bounded formatting helpers defined in vrt_util.c. */
int vrt_vscnprintf(char *buf, size_t size, const char *fmt, va_list args);
int vrt_scnprintf(char *buf, size_t size, const char *fmt, ...);

/* Current time since the Epoch in micro-, milli- and whole seconds. */
int64_t vrt_usec_now(void);
int64_t vrt_msec_now(void);
int64_t vrt_sec_now(void);

sds getAbsolutePath(char *filename);

/* Number <-> string conversions. */
int ll2string(char* dst, size_t dstlen, long long svalue);
int string2ll(const char *s, size_t slen, long long *value);
int string2l(const char *s, size_t slen, long *lval);
int d2string(char *buf, size_t len, double value);

int create_dir(char *path);
int destroy_dir(char *dir);

int get_pid_from_reply(struct redisContext *redisctx, char *host, int port);

long long *get_range_from_string(char *str, size_t len, int *count);

sds get_host_port_from_address_string(char *address, int *port);

#endif


================================================
FILE: tests/vrtest.c
================================================
#include <stdio.h>
#include <stdlib.h>
#include <getopt.h>
#include <fcntl.h>
#include <errno.h>
#include <signal.h>
#include <sys/stat.h>
#include <sys/utsname.h>

#include <hiredis.h>

#include <vrt_util.h>
#include <vrt_public.h>
#include <vrt_simple.h>

/* Settings of the test runner collected from the command line. */
struct config {
    char *pid_filename; /* argument of -p/--pid-file; NULL when not given */

    /* NOTE(review): the two fields below are not referenced by the code in
     * this file; their intended use should be confirmed. */
    int pidfile;
    int pid;
};

static struct config config;

/* Flags set by vr_get_options(): -h sets both, -V sets show_version only. */
static int show_help;
static int show_version;

/* Long option names and the short option each one maps to. */
static struct option long_options[] = {
    { "help",           no_argument,        NULL,   'h' },
    { "version",        no_argument,        NULL,   'V' },
    { "execute-file",   required_argument,  NULL,   'e' },
    { "pid-file",       required_argument,  NULL,   'p' },
    { NULL,             0,                  NULL,    0  }
};

/* Short options; a trailing ':' marks an option that takes an argument. */
static char short_options[] = "hVe:p:";

static void
vr_show_usage(void)
{
    printf(
        "Usage: viretest [-?hV] [-e execute-file] [-p pid-file]" CRLF
        "" CRLF);
    printf(
        "Options:" CRLF
        "  -h, --help             : this help" CRLF
        "  -V, --version          : show version and exit" CRLF
        "  -e, --execute-file     : vire execute file, default is src/vire" CRLF
        "  -p, --pid-file         : pid file" CRLF
        "" CRLF);
}

/* Reset the option values to their defaults before the command line is
 * parsed: no pid file name is set. */
static void
vr_set_default_options(void)
{
    config.pid_filename = NULL;
}

/* Parse the command line with getopt_long().
 *
 *   -h  sets show_version and show_help
 *   -V  sets show_version
 *   -e  passes its argument to set_execute_file()
 *   -p  stores its argument in config.pid_filename
 *
 * getopt's own diagnostics are turned off; problems are logged here
 * instead. Returns VRT_OK when all options were accepted and VRT_ERROR on
 * the first invalid option or missing option argument. */
static int
vr_get_options(int argc, char **argv)
{
    int opt;

    opterr = 0;

    while ((opt = getopt_long(argc, argv, short_options, long_options, NULL)) != -1) {
        if (opt == 'h') {
            show_version = 1;
            show_help = 1;
        } else if (opt == 'V') {
            show_version = 1;
        } else if (opt == 'e') {
            set_execute_file(optarg);
        } else if (opt == 'p') {
            config.pid_filename = optarg;
        } else if (opt == '?' && (optopt == 'e' || optopt == 'p')) {
            /* A known option was given without its argument. */
            test_log_error("vire: option -%c requires string", optopt);
            return VRT_ERROR;
        } else {
            /* Unknown option, or a return value not handled above. */
            test_log_error("vire: invalid option -- '%c'", optopt);
            return VRT_ERROR;
        }
    }

    return VRT_OK;
}

/* Entry point of the test runner.
 *
 * Parses the options, handles -h/-V, then creates the work directory, runs
 * the test groups and removes the work directory again.
 *
 * Exit status: 0 when all test groups passed (or after -h/-V), 1 when the
 * options are invalid or at least one test group failed. */
int
main(int argc, char **argv)
{
    int ret;
    int ok_count = 0, all_count = 0;

    vr_set_default_options();

    ret = vr_get_options(argc, argv);
    if (ret != VRT_OK) {
        vr_show_usage();
        exit(1);
    }

    if (show_version) {
        test_log_out("This is viretest-%s", VR_VERSION_STRING);
        if (show_help) {
            vr_show_usage();
        }
        exit(0);
    }

    create_work_dir();

    test_log_out("Testing Vire version %s \n", VR_VERSION_STRING);

    ok_count+=simple_test(); all_count++;

    destroy_work_dir();

    /* Report failures through the exit status so that scripts and CI jobs
     * running this program can detect them. */
    if (ok_count != all_count) {
        return 1;
    }

    test_log_out("\n\\o/ \033[32;1mAll tests passed without errors!\033[0m\n");
    return VRT_OK;
}

================================================
FILE: tools/.gitignore
================================================
*.pyc
*.out
*.log