dist/redhat: don't try to adduser when the user already exists

Currently we get "failed adding user 'scylla'" on .rpm installation when the user already exists; we can skip adding the user in that case to prevent the error. Fixes #1958 Signed-off-by: Takuya ASADA <syuu@scylladb.com> Message-Id: <1482550075-27939-1-git-send-email-syuu@scylladb.com> (cherry picked from commit f3e45bc9ef)
tests: Remove unintentional enablement of trace-level logging
2016-12-27 09:48:22 +02:00 · 2016-12-21 15:39:28 +01:00 · 2016-12-20 20:09:10 +01:00 · 2016-12-20 20:09:10 +01:00 · 2016-12-20 20:09:10 +01:00 · 2016-12-20 20:09:10 +01:00
883 changed files with 45765 additions and 11097 deletions
--- a/.github/ISSUE_TEMPLATE.md
+++ b/.github/ISSUE_TEMPLATE.md
@@ -0,0 +1,9 @@
+*Installation details*
+Scylla version (or git commit hash):
+Cluster size:
+OS (RHEL/CentOS/Ubuntu/AWS AMI):
+
+*Hardware details (for performance issues)*          Delete if unneeded
+Platform (physical/VM/cloud instance type/docker):
+Hardware: sockets= cores= hyperthreading= memory=
+Disks: (SSD/HDD, count)
--- a/.gitmodules
+++ b/.gitmodules
@@ -1,6 +1,6 @@
 [submodule "seastar"]
 	path = seastar
-	url = ../seastar
+	url = ../scylla-seastar
 	ignore = dirty
 [submodule "swagger-ui"]
 	path = swagger-ui
--- a/README.md
+++ b/README.md
@@ -1,6 +1,6 @@
-#Scylla
+# Scylla

-##Building Scylla
+## Building Scylla

 In addition to required packages by Seastar, the following packages are required by Scylla.

@@ -8,14 +8,14 @@ In addition to required packages by Seastar, the following packages are required
 Scylla uses submodules, so make sure you pull the submodules first by doing:
 ```
 git submodule init
-git submodule update --recursive
+git submodule update --init --recursive
 ```

 ### Building and Running Scylla on Fedora
 * Installing required packages:

 ```
-sudo yum install yaml-cpp-devel lz4-devel zlib-devel snappy-devel jsoncpp-devel thrift-devel antlr3-tool antlr3-C++-devel libasan libubsan gcc-c++ gnutls-devel ninja-build ragel libaio-devel cryptopp-devel xfsprogs-devel numactl-devel hwloc-devel libpciaccess-devel libxml2-devel python3-pyparsing
+sudo dnf install yaml-cpp-devel lz4-devel zlib-devel snappy-devel jsoncpp-devel thrift-devel antlr3-tool antlr3-C++-devel libasan libubsan gcc-c++ gnutls-devel ninja-build ragel libaio-devel cryptopp-devel xfsprogs-devel numactl-devel hwloc-devel libpciaccess-devel libxml2-devel python3-pyparsing lksctp-tools-devel protobuf-devel protobuf-compiler systemd-devel libunwind-devel
 ```

 * Build Scylla
--- a/2
+++ b/2
@@ -1,6 +1,6 @@
 #!/bin/sh

-VERSION=666.development
+VERSION=1.4.3

 if test -f version
 then
--- a/api/api-doc/cache_service.json
+++ b/api/api-doc/cache_service.json
@@ -487,6 +487,36 @@
        }
      ]
    },
+    {
+      "path": "/cache_service/metrics/row/hits_moving_avrage",
+      "operations": [
+        {
+          "method": "GET",
+          "summary": "Get row hits moving avrage",
+          "type": "#/utils/rate_moving_average",
+          "nickname": "get_row_hits_moving_avrage",
+          "produces": [
+            "application/json"
+          ],
+          "parameters": []
+        }
+      ]
+    },
+    {
+      "path": "/cache_service/metrics/row/requests_moving_avrage",
+      "operations": [
+        {
+          "method": "GET",
+          "summary": "Get row requests moving avrage",
+          "type": "#/utils/rate_moving_average",
+          "nickname": "get_row_requests_moving_avrage",
+          "produces": [
+            "application/json"
+          ],
+          "parameters": []
+        }
+      ]
+    },
    {
      "path": "/cache_service/metrics/row/size",
      "operations": [
--- a/api/api-doc/collectd.json
+++ b/api/api-doc/collectd.json
@@ -55,6 +55,57 @@
                     "paramType":"query"
                  }
               ]
+            },
+            {
+               "method":"POST",
+               "summary":"Start reporting on one or more collectd metric",
+               "type":"void",
+               "nickname":"enable_collectd",
+               "produces":[
+                  "application/json"
+               ],
+               "parameters":[
+                  {
+                     "name":"pluginid",
+                     "description":"The plugin ID, describe the component the metric belongs to. Examples are cache, thrift, etc'. Regex are supported.The plugin ID, describe the component the metric belong to. Examples are: cache, thrift etc'. regex are supported",
+                     "required":true,
+                     "allowMultiple":false,
+                     "type":"string",
+                     "paramType":"path"
+                  },
+                  {
+                     "name":"instance",
+                     "description":"The plugin instance typically #CPU indicating per CPU metric. Regex are supported. Omit for all",
+                     "required":false,
+                     "allowMultiple":false,
+                     "type":"string",
+                     "paramType":"query"
+                  },
+                  {
+                     "name":"type",
+                     "description":"The plugin type, the type of the information. Examples are total_operations, bytes, total_operations, etc'. Regex are supported. Omit for all",
+                     "required":false,
+                     "allowMultiple":false,
+                     "type":"string",
+                     "paramType":"query"
+                  },
+                  {
+                     "name":"type_instance",
+                     "description":"The plugin type instance, the specific metric. Exampls are total_writes, total_size, zones, etc'. Regex are supported, Omit for all",
+                     "required":false,
+                     "allowMultiple":false,
+                     "type":"string",
+                     "paramType":"query"
+                  },
+                  {
+                     "name":"enable",
+                     "description":"set to true to enable all, anything else or omit to disable",
+                     "required":false,
+                     "allowMultiple":false,
+                     "type":"boolean",
+                     "paramType":"query"
+                  }
+               ]
            }
         ]
      },
@@ -63,10 +114,10 @@
         "operations":[
            {
               "method":"GET",
-               "summary":"Get a collectd value",
+               "summary":"Get a list of all collectd metrics and their status",
               "type":"array",
               "items":{
-                  "type":"type_instance_id"
+                  "type":"collectd_metric_status"
               },
               "nickname":"get_collectd_items",
               "produces":[
@@ -74,6 +125,25 @@
               ],
               "parameters":[
               ]
+            },
+            {
+               "method":"POST",
+               "summary":"Enable or disable all collectd metrics",
+               "type":"void",
+               "nickname":"enable_all_collectd",
+               "produces":[
+                  "application/json"
+               ],
+               "parameters":[
+                  {
+                     "name":"enable",
+                     "description":"set to true to enable all, anything else or omit to disable",
+                     "required":false,
+                     "allowMultiple":false,
+                     "type":"boolean",
+                     "paramType":"query"
+                  }
+               ]
            }
         ]
      }
@@ -113,6 +183,20 @@
               }
            }
         }
+      },
+      "collectd_metric_status":{
+         "id":"collectd_metric_status",
+         "description":"Holds a collectd id and an enable flag",
+         "properties":{
+            "id":{
+               "description":"The metric ID",
+               "type":"type_instance_id"
+            },
+            "enable":{
+               "description":"Is the metric enabled",
+               "type":"boolean"
+            }
+         }
      }
   }
 }
--- a/api/api-doc/column_family.json
+++ b/api/api-doc/column_family.json
@@ -1094,7 +1094,7 @@
               "method":"GET",
               "summary":"Get read latency histogram",
               "$ref": "#/utils/histogram",
-               "nickname":"get_read_latency_histogram",
+               "nickname":"get_read_latency_histogram_depricated",
               "produces":[
                  "application/json"
               ],
@@ -1121,6 +1121,49 @@
               "items":{
                  "$ref": "#/utils/histogram"
               },
+               "nickname":"get_all_read_latency_histogram_depricated",
+               "produces":[
+                  "application/json"
+               ],
+               "parameters":[
+               ]
+            }
+         ]
+      },
+      {
+         "path":"/column_family/metrics/read_latency/moving_average_histogram/{name}",
+         "operations":[
+            {
+               "method":"GET",
+               "summary":"Get read latency moving avrage histogram",
+               "$ref": "#/utils/rate_moving_average_and_histogram",
+               "nickname":"get_read_latency_histogram",
+               "produces":[
+                  "application/json"
+               ],
+               "parameters":[
+                  {
+                     "name":"name",
+                     "description":"The column family name in keysspace:name format",
+                     "required":true,
+                     "allowMultiple":false,
+                     "type":"string",
+                     "paramType":"path"
+                  }
+               ]
+            }
+         ]
+      },
+      {
+         "path":"/column_family/metrics/read_latency/moving_average_histogram/",
+         "operations":[
+            {
+               "method":"GET",
+               "summary":"Get read latency moving avrage histogram from all column family",
+               "type":"array",
+               "items":{
+                  "$ref": "#/utils/rate_moving_average_and_histogram"
+               },
               "nickname":"get_all_read_latency_histogram",
               "produces":[
                  "application/json"
@@ -1260,7 +1303,7 @@
               "method":"GET",
               "summary":"Get write latency histogram",
               "$ref": "#/utils/histogram",
-               "nickname":"get_write_latency_histogram",
+               "nickname":"get_write_latency_histogram_depricated",
               "produces":[
                  "application/json"
               ],
@@ -1287,6 +1330,49 @@
               "items":{
                  "$ref": "#/utils/histogram"
               },
+               "nickname":"get_all_write_latency_histogram_depricated",
+               "produces":[
+                  "application/json"
+               ],
+               "parameters":[
+               ]
+            }
+         ]
+      },
+      {
+         "path":"/column_family/metrics/write_latency/moving_average_histogram/{name}",
+         "operations":[
+            {
+               "method":"GET",
+               "summary":"Get write latency moving average histogram",
+               "$ref": "#/utils/rate_moving_average_and_histogram",
+               "nickname":"get_write_latency_histogram",
+               "produces":[
+                  "application/json"
+               ],
+               "parameters":[
+                  {
+                     "name":"name",
+                     "description":"The column family name in keysspace:name format",
+                     "required":true,
+                     "allowMultiple":false,
+                     "type":"string",
+                     "paramType":"path"
+                  }
+               ]
+            }
+         ]
+      },
+      {
+         "path":"/column_family/metrics/write_latency/moving_average_histogram/",
+         "operations":[
+            {
+               "method":"GET",
+               "summary":"Get write latency moving average histogram of all column family",
+               "type":"array",
+               "items":{
+                  "$ref": "#/utils/rate_moving_average_and_histogram"
+               },
               "nickname":"get_all_write_latency_histogram",
               "produces":[
                  "application/json"
--- a/api/api-doc/storage_proxy.json
+++ b/api/api-doc/storage_proxy.json
@@ -716,6 +716,36 @@
        }
      ]
    },
+    {
+      "path": "/storage_proxy/metrics/read/timeouts_rates",
+      "operations": [
+        {
+          "method": "GET",
+          "summary": "Get read metrics rates",
+          "type": "#/utils/rate_moving_average",
+          "nickname": "get_read_metrics_timeouts_rates",
+          "produces": [
+            "application/json"
+          ],
+          "parameters": []
+        }
+      ]
+    },
+    {
+      "path": "/storage_proxy/metrics/read/unavailables_rates",
+      "operations": [
+        {
+          "method": "GET",
+          "summary": "Get read metrics rates",
+          "type": "#/utils/rate_moving_average",
+          "nickname": "get_read_metrics_unavailables_rates",
+          "produces": [
+            "application/json"
+          ],
+          "parameters": []
+        }
+      ]
+    },
    {
      "path": "/storage_proxy/metrics/read/histogram",
      "operations": [
@@ -723,7 +753,7 @@
          "method": "GET",
          "summary": "Get read metrics",
          "$ref": "#/utils/histogram",
-          "nickname": "get_read_metrics_latency_histogram",
+          "nickname": "get_read_metrics_latency_histogram_depricated",
          "produces": [
            "application/json"
          ],
@@ -738,6 +768,36 @@
          "method": "GET",
          "summary": "Get range metrics",
          "$ref": "#/utils/histogram",
+          "nickname": "get_range_metrics_latency_histogram_depricated",
+          "produces": [
+            "application/json"
+          ],
+          "parameters": []
+        }
+      ]
+    },
+    {
+      "path": "/storage_proxy/metrics/read/moving_average_histogram",
+      "operations": [
+        {
+          "method": "GET",
+          "summary": "Get read metrics",
+          "$ref": "#/utils/rate_moving_average_and_histogram",
+          "nickname": "get_read_metrics_latency_histogram",
+          "produces": [
+            "application/json"
+          ],
+          "parameters": []
+        }
+      ]
+    },
+    {
+      "path": "/storage_proxy/metrics/range/moving_average_histogram",
+      "operations": [
+        {
+          "method": "GET",
+          "summary": "Get range metrics rate and histogram",
+          "$ref": "#/utils/rate_moving_average_and_histogram",
          "nickname": "get_range_metrics_latency_histogram",
          "produces": [
            "application/json"
@@ -776,6 +836,36 @@
        }
      ]
    },
+    {
+      "path": "/storage_proxy/metrics/range/timeouts_rates",
+      "operations": [
+        {
+          "method": "GET",
+          "summary": "Get range metrics rates",
+          "type": "#/utils/rate_moving_average",
+          "nickname": "get_range_metrics_timeouts_rates",
+          "produces": [
+            "application/json"
+          ],
+          "parameters": []
+        }
+      ]
+    },
+    {
+      "path": "/storage_proxy/metrics/range/unavailables_rates",
+      "operations": [
+        {
+          "method": "GET",
+          "summary": "Get range metrics rates",
+          "type": "#/utils/rate_moving_average",
+          "nickname": "get_range_metrics_unavailables_rates",
+          "produces": [
+            "application/json"
+          ],
+          "parameters": []
+        }
+      ]
+    },
    {
      "path": "/storage_proxy/metrics/write/timeouts",
      "operations": [
@@ -806,6 +896,36 @@
        }
      ]
    },
+    {
+      "path": "/storage_proxy/metrics/write/timeouts_rates",
+      "operations": [
+        {
+          "method": "GET",
+          "summary": "Get write metrics rates",
+          "type": "#/utils/rate_moving_average",
+          "nickname": "get_write_metrics_timeouts_rates",
+          "produces": [
+            "application/json"
+          ],
+          "parameters": []
+        }
+      ]
+    },
+    {
+      "path": "/storage_proxy/metrics/write/unavailables_rates",
+      "operations": [
+        {
+          "method": "GET",
+          "summary": "Get write metrics rates",
+          "type": "#/utils/rate_moving_average",
+          "nickname": "get_write_metrics_unavailables_rates",
+          "produces": [
+            "application/json"
+          ],
+          "parameters": []
+        }
+      ]
+    },
    {
      "path": "/storage_proxy/metrics/write/histogram",
      "operations": [
@@ -813,6 +933,21 @@
          "method": "GET",
          "summary": "Get write metrics",
          "$ref": "#/utils/histogram",
+          "nickname": "get_write_metrics_latency_histogram_depricated",
+          "produces": [
+            "application/json"
+          ],
+          "parameters": []
+        }
+      ]
+    },
+    {
+      "path": "/storage_proxy/metrics/write/moving_average_histogram",
+      "operations": [
+        {
+          "method": "GET",
+          "summary": "Get write metrics",
+          "$ref": "#/utils/rate_moving_average_and_histogram",
          "nickname": "get_write_metrics_latency_histogram",
          "produces": [
            "application/json"
--- a/api/api-doc/storage_service.json
+++ b/api/api-doc/storage_service.json
@@ -177,6 +177,22 @@
            }
         ]
      },
+      {
+         "path":"/storage_service/scylla_release_version",
+         "operations":[
+            {
+               "method":"GET",
+               "summary":"Fetch a string representation of the Scylla version.",
+               "type":"string",
+               "nickname":"get_scylla_release_version",
+               "produces":[
+                  "application/json"
+               ],
+               "parameters":[
+               ]
+            }
+         ]
+      },
      {
         "path":"/storage_service/schema_version",
         "operations":[
@@ -1720,6 +1736,57 @@
            }
         ]
      },
+      {
+         "path":"/storage_service/slow_query",
+         "operations":[
+            {
+               "method":"POST",
+               "summary":"Set slow query parameter",
+               "type":"void",
+               "nickname":"set_slow_query",
+               "produces":[
+                  "application/json"
+               ],
+               "parameters":[
+                  {
+                     "name":"enable",
+                     "description":"set it to true to enable, anything else to disable",
+                     "required":false,
+                     "allowMultiple":false,
+                     "type":"boolean",
+                     "paramType":"query"
+                  },
+                  {
+                     "name":"ttl",
+                     "description":"TTL in seconds",
+                     "required":false,
+                     "allowMultiple":false,
+                     "type":"long",
+                     "paramType":"query"
+                  },
+                  {
+                     "name":"threshold",
+                     "description":"Slow query record threshold in microseconds",
+                     "required":false,
+                     "allowMultiple":false,
+                     "type":"long",
+                     "paramType":"query"
+                  }
+               ]
+            },
+            {
+               "method":"GET",
+               "summary":"Returns the slow query record configuration.",
+               "type":"slow_query_info",
+               "nickname":"get_slow_query_info",
+               "produces":[
+                  "application/json"
+               ],
+               "parameters":[
+               ]
+            }
+         ]
+      },
      {
         "path":"/storage_service/auto_compaction/{keyspace}",
         "operations":[
@@ -2117,6 +2184,24 @@
            }
         }
      },
+      "slow_query_info": {
+         "id":"slow_query_info",
+         "description":"Slow query triggering information",
+         "properties":{
+            "enable":{
+               "type":"boolean",
+               "description":"Is slow query logging enable or disable"
+            },
+            "ttl":{
+               "type":"long",
+               "description":"The slow query TTL in seconds"
+            },
+            "threshold":{
+               "type":"long",
+               "description":"The slow query logging threshold in microseconds. Queries that takes longer, will be logged"
+            }
+         }
+      },
      "endpoint_detail":{
         "id":"endpoint_detail",
         "description":"Endpoint detail",
--- a/api/api-doc/utils.json
+++ b/api/api-doc/utils.json
@@ -65,6 +65,41 @@
               "description":"The series of values to which the counts in `buckets` correspond"
            }
         }
-      }
-   }
+      },
+    "rate_moving_average": {
+         "id":"rate_moving_average",
+         "description":"A meter metric which measures mean throughput and one, five, and fifteen-minute exponentially-weighted moving average throughputs",
+         "properties":{
+             "rates": {
+               "type":"array",
+               "items":{
+                  "type":"double"
+               },
+               "description":"One, five and fifteen mintues rates"
+            },
+            "mean_rate": {
+               "type":"double",
+               "description":"The mean rate from startup"
+            },
+            "count": {
+               "type":"long",
+               "description":"Total number of events from startup"
+            }
+         }
+    },
+    "rate_moving_average_and_histogram": {
+         "id":"rate_moving_average_and_histogram",
+         "description":"A timer metric which aggregates timing durations and provides duration statistics, plus throughput statistics",
+         "properties":{
+            "meter": {
+               "type":"rate_moving_average",
+               "description":"The metric rate moving average"
+            },
+            "hist": {
+               "type":"histogram",
+               "description":"The metric histogram"
+            }
+         }
+    }
+  }
 }
--- a/api/api.cc
+++ b/api/api.cc
@@ -61,10 +61,10 @@ future<> set_server_init(http_context& ctx) {
                new content_replace("html")));
        r.add(GET, url("/ui").remainder("path"), new httpd::directory_handler(ctx.api_dir,
                new content_replace("html")));
+        rb->set_api_doc(r);
        rb->register_function(r, "system",
                "The system related API");
        set_system(ctx, r);
-        rb->set_api_doc(r);
    });
 }

@@ -83,6 +83,10 @@ future<> set_server_storage_service(http_context& ctx) {
    return register_api(ctx, "storage_service", "The storage service API", set_storage_service);
 }

+future<> set_server_snitch(http_context& ctx) {
+    return register_api(ctx, "endpoint_snitch_info", "The endpoint snitch info API", set_endpoint_snitch);
+}
+
 future<> set_server_gossip(http_context& ctx) {
    return register_api(ctx, "gossiper",
                "The gossiper API", set_gossiper);
@@ -118,10 +122,6 @@ future<> set_server_gossip_settle(http_context& ctx) {
        rb->register_function(r, "cache_service",
                "The cache service API");
        set_cache_service(ctx,r);
-
-        rb->register_function(r, "endpoint_snitch_info",
-                "The endpoint snitch info API");
-        set_endpoint_snitch(ctx, r);
    });
 }

--- a/api/api.hh
+++ b/api/api.hh
@@ -110,61 +110,49 @@ future<json::json_return_type>  sum_stats(distributed<T>& d, V F::*f) {
    });
 }

-inline double pow2(double a) {
-    return a * a;
-}

-// FIXME: Move to utils::ihistogram::operator+=()
-inline utils::ihistogram add_histogram(utils::ihistogram res,
-        const utils::ihistogram& val) {
-    if (res.count == 0) {
-        return val;
-    }
-    if (val.count == 0) {
-        return std::move(res);
-    }
-    if (res.min > val.min) {
-        res.min = val.min;
-    }
-    if (res.max < val.max) {
-        res.max = val.max;
-    }
-    double ncount = res.count + val.count;
-    // To get an estimated sum we take the estimated mean
-    // and multiply it by the true count
-    res.sum = res.sum + val.mean * val.count;
-    double a = res.count/ncount;
-    double b = val.count/ncount;
-
-    double mean =  a * res.mean + b * val.mean;
-
-    res.variance = (res.variance + pow2(res.mean - mean) )* a +
-            (val.variance + pow2(val.mean -mean))* b;
-
-    res.mean = mean;
-    res.count = res.count + val.count;
-    for (auto i : val.sample) {
-        res.sample.push_back(i);
-    }
-    return res;
-}

 inline
 httpd::utils_json::histogram to_json(const utils::ihistogram& val) {
    httpd::utils_json::histogram h;
    h = val;
+    h.sum = val.estimated_sum();
+    return h;
+}
+
+inline
+httpd::utils_json::rate_moving_average meter_to_json(const utils::rate_moving_average& val) {
+    httpd::utils_json::rate_moving_average m;
+    m = val;
+    return m;
+}
+
+inline
+httpd::utils_json::rate_moving_average_and_histogram timer_to_json(const utils::rate_moving_average_and_histogram& val) {
+    httpd::utils_json::rate_moving_average_and_histogram h;
+    h.hist = to_json(val.hist);
+    h.meter = meter_to_json(val.rate);
    return h;
 }

 template<class T, class F>
-future<json::json_return_type>  sum_histogram_stats(distributed<T>& d, utils::ihistogram F::*f) {
+future<json::json_return_type>  sum_histogram_stats(distributed<T>& d, utils::timed_rate_moving_average_and_histogram F::*f) {

-    return d.map_reduce0([f](const T& p) {return p.get_stats().*f;}, utils::ihistogram(),
-            add_histogram).then([](const utils::ihistogram& val) {
+    return d.map_reduce0([f](const T& p) {return (p.get_stats().*f).hist;}, utils::ihistogram(),
+            std::plus<utils::ihistogram>()).then([](const utils::ihistogram& val) {
        return make_ready_future<json::json_return_type>(to_json(val));
    });
 }

+template<class T, class F>
+future<json::json_return_type>  sum_timer_stats(distributed<T>& d, utils::timed_rate_moving_average_and_histogram F::*f) {
+
+    return d.map_reduce0([f](const T& p) {return (p.get_stats().*f).rate();}, utils::rate_moving_average_and_histogram(),
+            std::plus<utils::rate_moving_average_and_histogram>()).then([](const utils::rate_moving_average_and_histogram& val) {
+        return make_ready_future<json::json_return_type>(timer_to_json(val));
+    });
+}
+
 inline int64_t min_int64(int64_t a, int64_t b) {
    return std::min(a,b);
 }
--- a/api/api_init.hh
+++ b/api/api_init.hh
@@ -38,6 +38,7 @@ struct http_context {
 };

 future<> set_server_init(http_context& ctx);
+future<> set_server_snitch(http_context& ctx);
 future<> set_server_storage_service(http_context& ctx);
 future<> set_server_gossip(http_context& ctx);
 future<> set_server_load_sstable(http_context& ctx);
--- a/api/cache_service.cc
+++ b/api/cache_service.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -194,30 +194,46 @@ void set_cache_service(http_context& ctx, routes& r) {
    });

    cs::get_row_capacity.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return map_reduce_cf(ctx, 0, [](const column_family& cf) {
+        return map_reduce_cf(ctx, uint64_t(0), [](const column_family& cf) {
            return cf.get_row_cache().get_cache_tracker().region().occupancy().used_space();
        }, std::plus<uint64_t>());
    });

    cs::get_row_hits.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return map_reduce_cf(ctx, 0, [](const column_family& cf) {
-            return cf.get_row_cache().stats().hits;
-        }, std::plus<int64_t>());
+        return map_reduce_cf(ctx, uint64_t(0), [](const column_family& cf) {
+            return cf.get_row_cache().stats().hits.count();
+        }, std::plus<uint64_t>());
    });

    cs::get_row_requests.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return map_reduce_cf(ctx, 0, [](const column_family& cf) {
-            return cf.get_row_cache().stats().hits + cf.get_row_cache().stats().misses;
-        }, std::plus<int64_t>());
+        return map_reduce_cf(ctx, uint64_t(0), [](const column_family& cf) {
+            return cf.get_row_cache().stats().hits.count() + cf.get_row_cache().stats().misses.count();
+        }, std::plus<uint64_t>());
    });

    cs::get_row_hit_rate.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, ratio_holder(), [](const column_family& cf) {
-            return ratio_holder(cf.get_row_cache().stats().hits + cf.get_row_cache().stats().misses,
-                    cf.get_row_cache().stats().hits);
+            return ratio_holder(cf.get_row_cache().stats().hits.count() + cf.get_row_cache().stats().misses.count(),
+                    cf.get_row_cache().stats().hits.count());
        }, std::plus<ratio_holder>());
    });

+    cs::get_row_hits_moving_avrage.set(r, [&ctx] (std::unique_ptr<request> req) {
+        return map_reduce_cf_raw(ctx, utils::rate_moving_average(), [](const column_family& cf) {
+            return cf.get_row_cache().stats().hits.rate();
+        }, std::plus<utils::rate_moving_average>()).then([](const utils::rate_moving_average& m) {
+            return make_ready_future<json::json_return_type>(meter_to_json(m));
+        });
+    });
+
+    cs::get_row_requests_moving_avrage.set(r, [&ctx] (std::unique_ptr<request> req) {
+        return map_reduce_cf_raw(ctx, utils::rate_moving_average(), [](const column_family& cf) {
+            return cf.get_row_cache().stats().hits.rate() + cf.get_row_cache().stats().misses.rate();
+        }, std::plus<utils::rate_moving_average>()).then([](const utils::rate_moving_average& m) {
+            return make_ready_future<json::json_return_type>(meter_to_json(m));
+        });
+    });
+
    cs::get_row_size.set(r, [&ctx] (std::unique_ptr<request> req) {
        // In origin row size is the weighted size.
        // We currently do not support weights, so we use num entries instead
--- a/api/cache_service.hh
+++ b/api/cache_service.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/collectd.cc
+++ b/api/collectd.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -25,10 +25,14 @@
 #include "core/scollectd_api.hh"
 #include "endian.h"
 #include <boost/range/irange.hpp>
+#include <regex>

 namespace api {

 using namespace scollectd;
+using namespace httpd;
+
+using namespace json;
 namespace cd = httpd::collectd_json;

 static auto transformer(const std::vector<collectd_value>& values) {
@@ -49,6 +53,14 @@ static auto transformer(const std::vector<collectd_value>& values) {
    return collected_value;
 }

+
+static const char* str_to_regex(const sstring& v) {
+    if (v != "") {
+        return v.c_str();
+    }
+    return ".*";
+}
+
 void set_collectd(http_context& ctx, routes& r) {
    cd::get_collectd.set(r, [&ctx](std::unique_ptr<request> req) {

@@ -72,7 +84,7 @@ void set_collectd(http_context& ctx, routes& r) {
    });

    cd::get_collectd_items.set(r, [](const_req req) {
-        std::vector<cd::type_instance_id> res;
+        std::vector<cd::collectd_metric_status> res;
        auto ids = scollectd::get_collectd_ids();
        for (auto i: ids) {
            cd::type_instance_id id;
@@ -80,10 +92,44 @@ void set_collectd(http_context& ctx, routes& r) {
            id.plugin_instance = i.plugin_instance();
            id.type = i.type();
            id.type_instance = i.type_instance();
-            res.push_back(id);
+            cd::collectd_metric_status it;
+            it.id = id;
+            it.enable = scollectd::is_enabled(i);
+            res.push_back(it);
        }
        return res;
    });
+
+    cd::enable_collectd.set(r, [](std::unique_ptr<request> req) -> future<json::json_return_type> {
+        std::regex plugin(req->param["pluginid"].c_str());
+        std::regex instance(str_to_regex(req->get_query_param("instance")));
+        std::regex type(str_to_regex(req->get_query_param("type")));
+        std::regex type_instance(str_to_regex(req->get_query_param("type_instance")));
+        bool enable = strcasecmp(req->get_query_param("enable").c_str(), "true") == 0;
+        return smp::invoke_on_all([enable, plugin, instance, type, type_instance]() {
+            for (auto id: scollectd::get_collectd_ids()) {
+                if (std::regex_match(std::string(id.plugin()), plugin) &&
+                        std::regex_match(std::string(id.plugin_instance()), instance) &&
+                        std::regex_match(std::string(id.type()), type) &&
+                        std::regex_match(std::string(id.type_instance()), type_instance)) {
+                    scollectd::enable(id, enable);
+                }
+            }
+        }).then([] {
+            return json::json_return_type(json_void());
+        });
+    });
+
+    cd::enable_all_collectd.set(r, [](std::unique_ptr<request> req) -> future<json::json_return_type> {
+        bool enable = strcasecmp(req->get_query_param("enable").c_str(), "true") == 0;
+        return smp::invoke_on_all([enable] {
+            for (auto id: scollectd::get_collectd_ids()) {
+                scollectd::enable(id, enable);
+            }
+        }).then([] {
+            return json::json_return_type(json_void());
+        });
+    });
 }

 }
--- a/api/collectd.hh
+++ b/api/collectd.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/column_family.cc
+++ b/api/column_family.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -24,7 +24,7 @@
 #include <vector>
 #include "http/exception.hh"
 #include "sstables/sstables.hh"
-#include "sstables/estimated_histogram.hh"
+#include "utils/estimated_histogram.hh"
 #include <algorithm>

 namespace api {
@@ -40,7 +40,7 @@ const utils::UUID& get_uuid(const sstring& name, const database& db) {
    if (pos == sstring::npos) {
        pos  = name.find(":");
        if (pos == sstring::npos) {
-            throw bad_param_exception("Column family name should be in keyspace::column_family format");
+            throw bad_param_exception("Column family name should be in keyspace:column_family format");
        }
        end = pos + 1;
    } else {
@@ -77,14 +77,14 @@ future<json::json_return_type>  get_cf_stats(http_context& ctx,
 }

 static future<json::json_return_type>  get_cf_stats_count(http_context& ctx, const sstring& name,
-        utils::ihistogram column_family::stats::*f) {
+        utils::timed_rate_moving_average_and_histogram column_family::stats::*f) {
    return map_reduce_cf(ctx, name, int64_t(0), [f](const column_family& cf) {
-        return (cf.get_stats().*f).count;
+        return (cf.get_stats().*f).hist.count;
    }, std::plus<int64_t>());
 }

 static future<json::json_return_type>  get_cf_stats_sum(http_context& ctx, const sstring& name,
-        utils::ihistogram column_family::stats::*f) {
+        utils::timed_rate_moving_average_and_histogram column_family::stats::*f) {
    auto uuid = get_uuid(name, ctx.db.local());
    return ctx.db.map_reduce0([uuid, f](database& db) {
        // Histograms information is sample of the actual load
@@ -92,7 +92,7 @@ static future<json::json_return_type>  get_cf_stats_sum(http_context& ctx, const
        // with count. The information is gather in nano second,
        // but reported in micro
        column_family& cf = db.find_column_family(uuid);
-        return ((cf.get_stats().*f).count/1000.0) * (cf.get_stats().*f).mean;
+        return ((cf.get_stats().*f).hist.count/1000.0) * (cf.get_stats().*f).hist.mean;
    }, 0.0, std::plus<double>()).then([](double res) {
        return make_ready_future<json::json_return_type>((int64_t)res);
    });
@@ -100,28 +100,29 @@ static future<json::json_return_type>  get_cf_stats_sum(http_context& ctx, const


 static future<json::json_return_type>  get_cf_stats_count(http_context& ctx,
-        utils::ihistogram column_family::stats::*f) {
+        utils::timed_rate_moving_average_and_histogram column_family::stats::*f) {
    return map_reduce_cf(ctx, int64_t(0), [f](const column_family& cf) {
-        return (cf.get_stats().*f).count;
+        return (cf.get_stats().*f).hist.count;
    }, std::plus<int64_t>());
 }

 static future<json::json_return_type>  get_cf_histogram(http_context& ctx, const sstring& name,
-        utils::ihistogram column_family::stats::*f) {
+        utils::timed_rate_moving_average_and_histogram column_family::stats::*f) {
    utils::UUID uuid = get_uuid(name, ctx.db.local());
-    return ctx.db.map_reduce0([f, uuid](const database& p) {return p.find_column_family(uuid).get_stats().*f;},
+    return ctx.db.map_reduce0([f, uuid](const database& p) {
+        return (p.find_column_family(uuid).get_stats().*f).hist;},
            utils::ihistogram(),
-            add_histogram)
+            std::plus<utils::ihistogram>())
            .then([](const utils::ihistogram& val) {
                return make_ready_future<json::json_return_type>(to_json(val));
    });
 }

-static future<json::json_return_type> get_cf_histogram(http_context& ctx, utils::ihistogram column_family::stats::*f) {
+static future<json::json_return_type> get_cf_histogram(http_context& ctx, utils::timed_rate_moving_average_and_histogram column_family::stats::*f) {
    std::function<utils::ihistogram(const database&)> fun = [f] (const database& db)  {
        utils::ihistogram res;
        for (auto i : db.get_column_families()) {
-            res = add_histogram(res, i.second->get_stats().*f);
+            res += (i.second->get_stats().*f).hist;
        }
        return res;
    };
@@ -132,6 +133,33 @@ static future<json::json_return_type> get_cf_histogram(http_context& ctx, utils:
    });
 }

+static future<json::json_return_type>  get_cf_rate_and_histogram(http_context& ctx, const sstring& name,
+        utils::timed_rate_moving_average_and_histogram column_family::stats::*f) {
+    // Take rate() of the selected stat of the named table from each database and sum the results.
+    using snapshot = utils::rate_moving_average_and_histogram;
+    utils::UUID id = get_uuid(name, ctx.db.local());
+    return ctx.db.map_reduce0([f, id](const database& shard_db) {
+        return (shard_db.find_column_family(id).get_stats().*f).rate();
+    }, snapshot(), std::plus<snapshot>()).then([](const snapshot& total) {
+        return make_ready_future<json::json_return_type>(timer_to_json(total));
+    });
+}
+
+static future<json::json_return_type> get_cf_rate_and_histogram(http_context& ctx, utils::timed_rate_moving_average_and_histogram column_family::stats::*f) {
+    std::function<utils::rate_moving_average_and_histogram(const database&)> fun = [f] (const database& db)  {
+        utils::rate_moving_average_and_histogram res;  // sum of the selected stat over every table in db
+        for (const auto& i : db.get_column_families()) {  // by reference: no per-entry pair copy
+            res += (i.second->get_stats().*f).rate();
+        }
+        return res;
+    };
+    return ctx.db.map(fun).then([](const std::vector<utils::rate_moving_average_and_histogram> &res) {
+        std::vector<httpd::utils_json::rate_moving_average_and_histogram> r;  // one JSON entry per mapped result
+        boost::copy(res | boost::adaptors::transformed(timer_to_json), std::back_inserter(r));
+        return make_ready_future<json::json_return_type>(r);
+    });
+}
+
 static future<json::json_return_type> get_cf_unleveled_sstables(http_context& ctx, const sstring& name) {
    return map_reduce_cf(ctx, name, int64_t(0), [](const column_family& cf) {
        return cf.get_unleveled_sstables();
@@ -141,7 +169,7 @@ static future<json::json_return_type> get_cf_unleveled_sstables(http_context& ct
 static int64_t min_row_size(column_family& cf) {
    int64_t res = INT64_MAX;
    for (auto i: *cf.get_sstables() ) {
-        res = std::min(res, i.second->get_stats_metadata().estimated_row_size.min());
+        res = std::min(res, i->get_stats_metadata().estimated_row_size.min());
    }
    return (res == INT64_MAX) ? 0 : res;
 }
@@ -149,7 +177,7 @@ static int64_t min_row_size(column_family& cf) {
 static int64_t max_row_size(column_family& cf) {
    int64_t res = 0;
    for (auto i: *cf.get_sstables() ) {
-        res = std::max(i.second->get_stats_metadata().estimated_row_size.max(), res);
+        res = std::max(i->get_stats_metadata().estimated_row_size.max(), res);
    }
    return res;
 }
@@ -166,13 +194,95 @@ static double update_ratio(double acc, double f, double total) {
 static ratio_holder mean_row_size(column_family& cf) {
    ratio_holder res;
    for (auto i: *cf.get_sstables() ) {
-        auto c = i.second->get_stats_metadata().estimated_row_size.count();
-        res.sub += i.second->get_stats_metadata().estimated_row_size.mean() * c;
+        auto c = i->get_stats_metadata().estimated_row_size.count();
+        res.sub += i->get_stats_metadata().estimated_row_size.mean() * c;
        res.total += c;
    }
    return res;
 }

+static std::unordered_map<sstring, uint64_t> merge_maps(std::unordered_map<sstring, uint64_t> a,
+        const std::unordered_map<sstring, uint64_t>& b) {
+    for (const auto& entry : b) { a.insert(entry); }  // insert() leaves keys already present in a untouched
+    return a;
+}
+
+static json::json_return_type sum_map(const std::unordered_map<sstring, uint64_t>& val) {
+    uint64_t res = 0;  // total of all mapped values; the keys are ignored
+    for (const auto& i : val) {  // by reference: avoids copying every sstring key
+        res += i.second;
+    }
+    return res;
+}
+
+static future<json::json_return_type>  sum_sstable(http_context& ctx, const sstring& name, bool total) {
+    auto uuid = get_uuid(name, ctx.db.local());  // name is only read here, so a reference is enough
+    return ctx.db.map_reduce0([uuid, total](database& db) {
+        std::unordered_map<sstring, uint64_t> m;  // file name -> bytes on disk
+        auto sstables = (total) ? db.find_column_family(uuid).get_sstables_including_compacted_undeleted() :
+                db.find_column_family(uuid).get_sstables();
+        for (const auto& t : *sstables) {  // by reference: no shared-pointer copy per sstable
+            m[t->get_filename()] = t->bytes_on_disk();
+        }
+        return m;
+    }, std::unordered_map<sstring, uint64_t>(), merge_maps).
+            then([](const std::unordered_map<sstring, uint64_t>& val) {
+        return sum_map(val);  // merged map holds one entry per file name
+    });
+}
+
+
+static future<json::json_return_type> sum_sstable(http_context& ctx, bool total) {
+    return map_reduce_cf_raw(ctx, std::unordered_map<sstring, uint64_t>(), [total](column_family& cf) {
+        std::unordered_map<sstring, uint64_t> m;  // file name -> bytes on disk
+        auto sstables = (total) ? cf.get_sstables_including_compacted_undeleted() :
+                cf.get_sstables();
+        for (const auto& t : *sstables) {  // by reference: no shared-pointer copy per sstable
+            m[t->get_filename()] = t->bytes_on_disk();
+        }
+        return m;
+    },merge_maps).then([](const std::unordered_map<sstring, uint64_t>& val) {
+        return sum_map(val);  // merged map holds one entry per file name
+    });
+}
+
+template <typename T>
+class sum_ratio {
+    T _sum = 0;
+    uint64_t _count = 0;
+public:
+    future<> operator()(T value) {
+        if (!(value > 0)) {
+            return make_ready_future<>();  // values that are not strictly positive are not counted
+        }
+        _sum += value;
+        ++_count;
+        return make_ready_future<>();
+    }
+    T get() && {  // mean of the counted values, or T(0) when nothing was counted
+        return (_count == 0) ? T(0) : (_sum / _count);
+    }
+};
+
+static double get_compression_ratio(column_family& cf) {
+    // Feed every sstable ratio that is not the NO_COMPRESSION_RATIO marker into the averager.
+    sum_ratio<double> averager;
+    for (auto sst : *cf.get_sstables()) {
+        const auto ratio = sst->get_compression_ratio();
+        const bool has_ratio = ratio != sstables::metadata_collector::NO_COMPRESSION_RATIO;
+        if (has_ratio) { averager(ratio); }
+    }
+    return std::move(averager).get();
+}
+
+static std::vector<uint64_t> concat_sstable_count_per_level(std::vector<uint64_t> a, std::vector<uint64_t>&& b) {
+    if (a.size() < b.size()) {
+        a.resize(b.size(), 0UL);  // grow with zeros so every level present in b has a slot in a
+    }
+    std::transform(b.begin(), b.end(), a.begin(), a.begin(), std::plus<uint64_t>());  // a[i] += b[i]
+    return a;
+}
+
 void set_column_family(http_context& ctx, routes& r) {
    cf::get_column_family_name.set(r, [&ctx] (const_req req){
        vector<sstring> res;
@@ -293,21 +403,21 @@ void set_column_family(http_context& ctx, routes& r) {
    });

    cf::get_estimated_row_size_histogram.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return map_reduce_cf(ctx, req->param["name"], sstables::estimated_histogram(0), [](column_family& cf) {
-            sstables::estimated_histogram res(0);
+        return map_reduce_cf(ctx, req->param["name"], utils::estimated_histogram(0), [](column_family& cf) {
+            utils::estimated_histogram res(0);
            for (auto i: *cf.get_sstables() ) {
-                res.merge(i.second->get_stats_metadata().estimated_row_size);
+                res.merge(i->get_stats_metadata().estimated_row_size);
            }
            return res;
        },
-        sstables::merge, utils_json::estimated_histogram());
+        utils::estimated_histogram_merge, utils_json::estimated_histogram());
    });

    cf::get_estimated_row_count.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, req->param["name"], int64_t(0), [](column_family& cf) {
            uint64_t res = 0;
            for (auto i: *cf.get_sstables() ) {
-                res += i.second->get_stats_metadata().estimated_row_size.count();
+                res += i->get_stats_metadata().estimated_row_size.count();
            }
            return res;
        },
@@ -315,14 +425,14 @@ void set_column_family(http_context& ctx, routes& r) {
    });

    cf::get_estimated_column_count_histogram.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return map_reduce_cf(ctx, req->param["name"], sstables::estimated_histogram(0), [](column_family& cf) {
-            sstables::estimated_histogram res(0);
+        return map_reduce_cf(ctx, req->param["name"], utils::estimated_histogram(0), [](column_family& cf) {
+            utils::estimated_histogram res(0);
            for (auto i: *cf.get_sstables() ) {
-                res.merge(i.second->get_stats_metadata().estimated_column_count);
+                res.merge(i->get_stats_metadata().estimated_column_count);
            }
            return res;
        },
-        sstables::merge, utils_json::estimated_histogram());
+        utils::estimated_histogram_merge, utils_json::estimated_histogram());
    });

    cf::get_all_compression_ratio.set(r, [] (std::unique_ptr<request> req) {
@@ -355,10 +465,14 @@ void set_column_family(http_context& ctx, routes& r) {
        return get_cf_stats_count(ctx, &column_family::stats::writes);
    });

-    cf::get_read_latency_histogram.set(r, [&ctx] (std::unique_ptr<request> req) {
+    cf::get_read_latency_histogram_depricated.set(r, [&ctx] (std::unique_ptr<request> req) {
        return get_cf_histogram(ctx, req->param["name"], &column_family::stats::reads);
    });

+    cf::get_read_latency_histogram.set(r, [&ctx] (std::unique_ptr<request> req) {
+        return get_cf_rate_and_histogram(ctx, req->param["name"], &column_family::stats::reads);
+    });
+
    cf::get_read_latency.set(r, [&ctx] (std::unique_ptr<request> req) {
        return get_cf_stats_sum(ctx,req->param["name"] ,&column_family::stats::reads);
    });
@@ -367,24 +481,40 @@ void set_column_family(http_context& ctx, routes& r) {
        return get_cf_stats_sum(ctx, req->param["name"] ,&column_family::stats::writes);
    });

-    cf::get_all_read_latency_histogram.set(r, [&ctx] (std::unique_ptr<request> req) {
+    cf::get_all_read_latency_histogram_depricated.set(r, [&ctx] (std::unique_ptr<request> req) {
        return get_cf_histogram(ctx, &column_family::stats::writes);
    });

-    cf::get_write_latency_histogram.set(r, [&ctx] (std::unique_ptr<request> req) {
+    cf::get_all_read_latency_histogram.set(r, [&ctx] (std::unique_ptr<request> req) {
+        return get_cf_rate_and_histogram(ctx, &column_family::stats::reads);  // read endpoint reports reads, not writes
+    });
+
+    cf::get_write_latency_histogram_depricated.set(r, [&ctx] (std::unique_ptr<request> req) {
        return get_cf_histogram(ctx, req->param["name"], &column_family::stats::writes);
    });

-    cf::get_all_write_latency_histogram.set(r, [&ctx] (std::unique_ptr<request> req) {
+    cf::get_write_latency_histogram.set(r, [&ctx] (std::unique_ptr<request> req) {
+        return get_cf_rate_and_histogram(ctx, req->param["name"], &column_family::stats::writes);
+    });
+
+    cf::get_all_write_latency_histogram_depricated.set(r, [&ctx] (std::unique_ptr<request> req) {
        return get_cf_histogram(ctx, &column_family::stats::writes);
    });

+    cf::get_all_write_latency_histogram.set(r, [&ctx] (std::unique_ptr<request> req) {
+        return get_cf_rate_and_histogram(ctx, &column_family::stats::writes);
+    });
+
    cf::get_pending_compactions.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return get_cf_stats(ctx, req->param["name"], &column_family::stats::pending_compactions);
+        return map_reduce_cf(ctx, req->param["name"], int64_t(0), [](column_family& cf) {
+            return cf.get_compaction_strategy().estimated_pending_compactions(cf);
+        }, std::plus<int64_t>());
    });

    cf::get_all_pending_compactions.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return get_cf_stats(ctx, &column_family::stats::pending_compactions);
+        return map_reduce_cf(ctx, int64_t(0), [](column_family& cf) {
+            return cf.get_compaction_strategy().estimated_pending_compactions(cf);
+        }, std::plus<int64_t>());
    });

    cf::get_live_ss_table_count.set(r, [&ctx] (std::unique_ptr<request> req) {
@@ -400,19 +530,19 @@ void set_column_family(http_context& ctx, routes& r) {
    });

    cf::get_live_disk_space_used.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return get_cf_stats(ctx, req->param["name"], &column_family::stats::live_disk_space_used);
+        return sum_sstable(ctx, req->param["name"], false);
    });

    cf::get_all_live_disk_space_used.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return get_cf_stats(ctx, &column_family::stats::live_disk_space_used);
+        return sum_sstable(ctx, false);
    });

    cf::get_total_disk_space_used.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return get_cf_stats(ctx, req->param["name"], &column_family::stats::total_disk_space_used);
+        return sum_sstable(ctx, req->param["name"], true);
    });

    cf::get_all_total_disk_space_used.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return get_cf_stats(ctx, &column_family::stats::total_disk_space_used);
+        return sum_sstable(ctx, true);
    });

    cf::get_min_row_size.set(r, [&ctx] (std::unique_ptr<request> req) {
@@ -442,7 +572,7 @@ void set_column_family(http_context& ctx, routes& r) {
    cf::get_bloom_filter_false_positives.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, req->param["name"], uint64_t(0), [] (column_family& cf) {
            return std::accumulate(cf.get_sstables()->begin(), cf.get_sstables()->end(), uint64_t(0), [](uint64_t s, auto& sst) {
-                return s + sst.second->filter_get_false_positive();
+                return s + sst->filter_get_false_positive();
            });
        }, std::plus<uint64_t>());
    });
@@ -450,7 +580,7 @@ void set_column_family(http_context& ctx, routes& r) {
    cf::get_all_bloom_filter_false_positives.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, uint64_t(0), [] (column_family& cf) {
            return std::accumulate(cf.get_sstables()->begin(), cf.get_sstables()->end(), uint64_t(0), [](uint64_t s, auto& sst) {
-                return s + sst.second->filter_get_false_positive();
+                return s + sst->filter_get_false_positive();
            });
        }, std::plus<uint64_t>());
    });
@@ -458,7 +588,7 @@ void set_column_family(http_context& ctx, routes& r) {
    cf::get_recent_bloom_filter_false_positives.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, req->param["name"], uint64_t(0), [] (column_family& cf) {
            return std::accumulate(cf.get_sstables()->begin(), cf.get_sstables()->end(), uint64_t(0), [](uint64_t s, auto& sst) {
-                return s + sst.second->filter_get_recent_false_positive();
+                return s + sst->filter_get_recent_false_positive();
            });
        }, std::plus<uint64_t>());
    });
@@ -466,7 +596,7 @@ void set_column_family(http_context& ctx, routes& r) {
    cf::get_all_recent_bloom_filter_false_positives.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, uint64_t(0), [] (column_family& cf) {
            return std::accumulate(cf.get_sstables()->begin(), cf.get_sstables()->end(), uint64_t(0), [](uint64_t s, auto& sst) {
-                return s + sst.second->filter_get_recent_false_positive();
+                return s + sst->filter_get_recent_false_positive();
            });
        }, std::plus<uint64_t>());
    });
@@ -474,8 +604,8 @@ void set_column_family(http_context& ctx, routes& r) {
    cf::get_bloom_filter_false_ratio.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, req->param["name"], double(0), [] (column_family& cf) {
            return std::accumulate(cf.get_sstables()->begin(), cf.get_sstables()->end(), double(0), [](double s, auto& sst) {
-                double f = sst.second->filter_get_false_positive();
-                return update_ratio(s, f, f + sst.second->filter_get_true_positive());
+                double f = sst->filter_get_false_positive();
+                return update_ratio(s, f, f + sst->filter_get_true_positive());
            });
        }, std::plus<double>());
    });
@@ -483,8 +613,8 @@ void set_column_family(http_context& ctx, routes& r) {
    cf::get_all_bloom_filter_false_ratio.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, double(0), [] (column_family& cf) {
            return std::accumulate(cf.get_sstables()->begin(), cf.get_sstables()->end(), double(0), [](double s, auto& sst) {
-                double f = sst.second->filter_get_false_positive();
-                return update_ratio(s, f, f + sst.second->filter_get_true_positive());
+                double f = sst->filter_get_false_positive();
+                return update_ratio(s, f, f + sst->filter_get_true_positive());
            });
        }, std::plus<double>());
    });
@@ -492,8 +622,8 @@ void set_column_family(http_context& ctx, routes& r) {
    cf::get_recent_bloom_filter_false_ratio.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, req->param["name"], double(0), [] (column_family& cf) {
            return std::accumulate(cf.get_sstables()->begin(), cf.get_sstables()->end(), double(0), [](double s, auto& sst) {
-                double f = sst.second->filter_get_recent_false_positive();
-                return update_ratio(s, f, f + sst.second->filter_get_recent_true_positive());
+                double f = sst->filter_get_recent_false_positive();
+                return update_ratio(s, f, f + sst->filter_get_recent_true_positive());
            });
        }, std::plus<double>());
    });
@@ -501,8 +631,8 @@ void set_column_family(http_context& ctx, routes& r) {
    cf::get_all_recent_bloom_filter_false_ratio.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, double(0), [] (column_family& cf) {
            return std::accumulate(cf.get_sstables()->begin(), cf.get_sstables()->end(), double(0), [](double s, auto& sst) {
-                double f = sst.second->filter_get_recent_false_positive();
-                return update_ratio(s, f, f + sst.second->filter_get_recent_true_positive());
+                double f = sst->filter_get_recent_false_positive();
+                return update_ratio(s, f, f + sst->filter_get_recent_true_positive());
            });
        }, std::plus<double>());
    });
@@ -510,7 +640,7 @@ void set_column_family(http_context& ctx, routes& r) {
    cf::get_bloom_filter_disk_space_used.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, req->param["name"], uint64_t(0), [] (column_family& cf) {
            return std::accumulate(cf.get_sstables()->begin(), cf.get_sstables()->end(), uint64_t(0), [](uint64_t s, auto& sst) {
-                return sst.second->filter_size();
+                return s + sst->filter_size();  // add to the running total instead of discarding it
            });
        }, std::plus<uint64_t>());
    });
@@ -518,7 +648,7 @@ void set_column_family(http_context& ctx, routes& r) {
    cf::get_all_bloom_filter_disk_space_used.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, uint64_t(0), [] (column_family& cf) {
            return std::accumulate(cf.get_sstables()->begin(), cf.get_sstables()->end(), uint64_t(0), [](uint64_t s, auto& sst) {
-                return sst.second->filter_size();
+                return s + sst->filter_size();  // add to the running total instead of discarding it
            });
        }, std::plus<uint64_t>());
    });
@@ -526,7 +656,7 @@ void set_column_family(http_context& ctx, routes& r) {
    cf::get_bloom_filter_off_heap_memory_used.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, req->param["name"], uint64_t(0), [] (column_family& cf) {
            return std::accumulate(cf.get_sstables()->begin(), cf.get_sstables()->end(), uint64_t(0), [](uint64_t s, auto& sst) {
-                return sst.second->filter_memory_size();
+                return s + sst->filter_memory_size();  // add to the running total instead of discarding it
            });
        }, std::plus<uint64_t>());
    });
@@ -534,7 +664,7 @@ void set_column_family(http_context& ctx, routes& r) {
    cf::get_all_bloom_filter_off_heap_memory_used.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, uint64_t(0), [] (column_family& cf) {
            return std::accumulate(cf.get_sstables()->begin(), cf.get_sstables()->end(), uint64_t(0), [](uint64_t s, auto& sst) {
-                return sst.second->filter_memory_size();
+                return s + sst->filter_memory_size();  // add to the running total instead of discarding it
            });
        }, std::plus<uint64_t>());
    });
@@ -542,7 +672,7 @@ void set_column_family(http_context& ctx, routes& r) {
    cf::get_index_summary_off_heap_memory_used.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, req->param["name"], uint64_t(0), [] (column_family& cf) {
            return std::accumulate(cf.get_sstables()->begin(), cf.get_sstables()->end(), uint64_t(0), [](uint64_t s, auto& sst) {
-                return sst.second->get_summary().memory_footprint();
+                return s + sst->get_summary().memory_footprint();  // add to the running total instead of discarding it
            });
        }, std::plus<uint64_t>());
    });
@@ -550,7 +680,7 @@ void set_column_family(http_context& ctx, routes& r) {
    cf::get_all_index_summary_off_heap_memory_used.set(r, [&ctx] (std::unique_ptr<request> req) {
        return map_reduce_cf(ctx, uint64_t(0), [] (column_family& cf) {
            return std::accumulate(cf.get_sstables()->begin(), cf.get_sstables()->end(), uint64_t(0), [](uint64_t s, auto& sst) {
-                return sst.second->get_summary().memory_footprint();
+                return s + sst->get_summary().memory_footprint();  // add to the running total instead of discarding it
            });
        }, std::plus<uint64_t>());
    });
@@ -623,27 +753,35 @@ void set_column_family(http_context& ctx, routes& r) {
    });

    cf::get_row_cache_hit.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return map_reduce_cf(ctx, req->param["name"], int64_t(0), [](const column_family& cf) {
-            return cf.get_row_cache().stats().hits;
-        }, std::plus<int64_t>());
+        return map_reduce_cf_raw(ctx, req->param["name"], utils::rate_moving_average(), [](const column_family& cf) {
+            return cf.get_row_cache().stats().hits.rate();
+        }, std::plus<utils::rate_moving_average>()).then([](const utils::rate_moving_average& m) {
+            return make_ready_future<json::json_return_type>(meter_to_json(m));
+        });
    });

    cf::get_all_row_cache_hit.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return map_reduce_cf(ctx, int64_t(0), [](const column_family& cf) {
-            return cf.get_row_cache().stats().hits;
-        }, std::plus<int64_t>());
+        return map_reduce_cf_raw(ctx, utils::rate_moving_average(), [](const column_family& cf) {
+            return cf.get_row_cache().stats().hits.rate();
+        }, std::plus<utils::rate_moving_average>()).then([](const utils::rate_moving_average& m) {
+            return make_ready_future<json::json_return_type>(meter_to_json(m));
+        });
    });

    cf::get_row_cache_miss.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return map_reduce_cf(ctx, req->param["name"], int64_t(0), [](const column_family& cf) {
-            return cf.get_row_cache().stats().misses;
-        }, std::plus<int64_t>());
+        return map_reduce_cf_raw(ctx, req->param["name"], utils::rate_moving_average(), [](const column_family& cf) {
+            return cf.get_row_cache().stats().misses.rate();
+        }, std::plus<utils::rate_moving_average>()).then([](const utils::rate_moving_average& m) {
+            return make_ready_future<json::json_return_type>(meter_to_json(m));
+        });
    });

    cf::get_all_row_cache_miss.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return map_reduce_cf(ctx, int64_t(0), [](const column_family& cf) {
-            return cf.get_row_cache().stats().misses;
-        }, std::plus<int64_t>());
+        return map_reduce_cf_raw(ctx, utils::rate_moving_average(), [](const column_family& cf) {
+            return cf.get_row_cache().stats().misses.rate();
+        }, std::plus<utils::rate_moving_average>()).then([](const utils::rate_moving_average& m) {
+            return make_ready_future<json::json_return_type>(meter_to_json(m));
+        });

    });

@@ -669,10 +807,10 @@ void set_column_family(http_context& ctx, routes& r) {
    });

    cf::get_sstables_per_read_histogram.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return map_reduce_cf(ctx, req->param["name"], sstables::estimated_histogram(0), [](column_family& cf) {
+        return map_reduce_cf(ctx, req->param["name"], utils::estimated_histogram(0), [](column_family& cf) {
            return cf.get_stats().estimated_sstable_per_read;
        },
-        sstables::merge, utils_json::estimated_histogram());
+        utils::estimated_histogram_merge, utils_json::estimated_histogram());
    });

    cf::get_tombstone_scanned_histogram.set(r, [&ctx] (std::unique_ptr<request> req) {
@@ -719,25 +857,29 @@ void set_column_family(http_context& ctx, routes& r) {
        return std::vector<sstring>();
    });

-    cf::get_compression_ratio.set(r, [](const_req) {
-        // FIXME
-        // Currently there are no compression information
-        // so we return 0 as the ratio
-        return 0;
+    cf::get_compression_ratio.set(r, [&ctx](std::unique_ptr<request> req) {
+        auto uuid = get_uuid(req->param["name"], ctx.db.local());
+
+        return ctx.db.map_reduce(sum_ratio<double>(), [uuid](database& db) {
+            column_family& cf = db.find_column_family(uuid);
+            return make_ready_future<double>(get_compression_ratio(cf));
+        }).then([] (const double& result) {
+            return make_ready_future<json::json_return_type>(result);
+        });
    });

    cf::get_read_latency_estimated_histogram.set(r, [&ctx](std::unique_ptr<request> req) {
-        return map_reduce_cf(ctx, req->param["name"], sstables::estimated_histogram(0), [](column_family& cf) {
+        return map_reduce_cf(ctx, req->param["name"], utils::estimated_histogram(0), [](column_family& cf) {
            return cf.get_stats().estimated_read;
        },
-        sstables::merge, utils_json::estimated_histogram());
+        utils::estimated_histogram_merge, utils_json::estimated_histogram());
    });

    cf::get_write_latency_estimated_histogram.set(r, [&ctx](std::unique_ptr<request> req) {
-        return map_reduce_cf(ctx, req->param["name"], sstables::estimated_histogram(0), [](column_family& cf) {
+        return map_reduce_cf(ctx, req->param["name"], utils::estimated_histogram(0), [](column_family& cf) {
            return cf.get_stats().estimated_write;
        },
-        sstables::merge, utils_json::estimated_histogram());
+        utils::estimated_histogram_merge, utils_json::estimated_histogram());
    });

    cf::set_compaction_strategy_class.set(r, [&ctx](std::unique_ptr<request> req) {
@@ -766,12 +908,11 @@ void set_column_family(http_context& ctx, routes& r) {
    });

    cf::get_sstable_count_per_level.set(r, [&ctx](std::unique_ptr<request> req) {
-        // TBD
-        // FIXME
-        // This is a workaround, until there will be an API to return the count
-        // per level, we return an empty array
-        vector<uint64_t> res;
-        return make_ready_future<json::json_return_type>(res);
+        return map_reduce_cf_raw(ctx, req->param["name"], std::vector<uint64_t>(), [](const column_family& cf) {
+            return cf.sstable_count_per_level();
+        }, concat_sstable_count_per_level).then([](const std::vector<uint64_t>& res) {
+            return make_ready_future<json::json_return_type>(res);
+        });
    });
 }
 }
--- a/api/column_family.hh
+++ b/api/column_family.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -34,31 +34,44 @@ future<> foreach_column_family(http_context& ctx, const sstring& name, std::func


 template<class Mapper, class I, class Reducer>
-future<json::json_return_type> map_reduce_cf(http_context& ctx, const sstring& name, I init,
+future<I> map_reduce_cf_raw(http_context& ctx, const sstring& name, I init,
        Mapper mapper, Reducer reducer) {
    auto uuid = get_uuid(name, ctx.db.local());
    return ctx.db.map_reduce0([mapper, uuid](database& db) {
        return mapper(db.find_column_family(uuid));
-    }, init, reducer).then([](const I& res) {
+    }, init, reducer);
+}
+
+
+template<class Mapper, class I, class Reducer>
+future<json::json_return_type> map_reduce_cf(http_context& ctx, const sstring& name, I init,
+        Mapper mapper, Reducer reducer) {
+    return map_reduce_cf_raw(ctx, name, init, mapper, reducer).then([](const I& res) {
        return make_ready_future<json::json_return_type>(res);
    });
 }

 template<class Mapper, class I, class Reducer, class Result>
-future<json::json_return_type> map_reduce_cf(http_context& ctx, const sstring& name, I init,
+future<I> map_reduce_cf_raw(http_context& ctx, const sstring& name, I init,
        Mapper mapper, Reducer reducer, Result result) {
    auto uuid = get_uuid(name, ctx.db.local());
    return ctx.db.map_reduce0([mapper, uuid](database& db) {
        return mapper(db.find_column_family(uuid));
-    }, init, reducer).then([result](const I& res) mutable {
+    }, init, reducer);
+}
+
+
+template<class Mapper, class I, class Reducer, class Result>
+future<json::json_return_type> map_reduce_cf(http_context& ctx, const sstring& name, I init,
+        Mapper mapper, Reducer reducer, Result result) {
+    return map_reduce_cf_raw(ctx, name, init, mapper, reducer, result).then([result](const I& res) mutable {
        result = res;
        return make_ready_future<json::json_return_type>(result);
    });
 }

-
 template<class Mapper, class I, class Reducer>
-future<json::json_return_type> map_reduce_cf(http_context& ctx, I init,
+future<I> map_reduce_cf_raw(http_context& ctx, I init,
        Mapper mapper, Reducer reducer) {
    return ctx.db.map_reduce0([mapper, init, reducer](database& db) {
        auto res = init;
@@ -66,10 +79,18 @@ future<json::json_return_type> map_reduce_cf(http_context& ctx, I init,
            res = reducer(res, mapper(*i.second.get()));
        }
        return res;
-    }, init, reducer).then([](const I& res) {
+    }, init, reducer);
+}
+
+
+template<class Mapper, class I, class Reducer>
+future<json::json_return_type> map_reduce_cf(http_context& ctx, I init,
+        Mapper mapper, Reducer reducer) {
+    return map_reduce_cf_raw(ctx, init, mapper, reducer).then([](const I& res) {
        return make_ready_future<json::json_return_type>(res);
    });
 }
+
 future<json::json_return_type>  get_cf_stats(http_context& ctx, const sstring& name,
        int64_t column_family::stats::*f);

--- a/api/commitlog.cc
+++ b/api/commitlog.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/commitlog.hh
+++ b/api/commitlog.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/compaction_manager.cc
+++ b/api/compaction_manager.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -22,6 +22,7 @@
 #include "compaction_manager.hh"
 #include "api/api-doc/compaction_manager.json.hh"
 #include "db/system_keyspace.hh"
+#include "column_family.hh"

 namespace api {

@@ -78,7 +79,9 @@ void set_compaction_manager(http_context& ctx, routes& r) {
    });

    cm::get_pending_tasks.set(r, [&ctx] (std::unique_ptr<request> req) {
-        return get_cm_stats(ctx, &compaction_manager::stats::pending_tasks);
+        return map_reduce_cf(ctx, int64_t(0), [](column_family& cf) {
+            return cf.get_compaction_strategy().estimated_pending_compactions(cf);
+        }, std::plus<int64_t>());
    });

    cm::get_completed_tasks.set(r, [&ctx] (std::unique_ptr<request> req) {
--- a/api/compaction_manager.hh
+++ b/api/compaction_manager.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/endpoint_snitch.cc
+++ b/api/endpoint_snitch.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/endpoint_snitch.hh
+++ b/api/endpoint_snitch.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/failure_detector.cc
+++ b/api/failure_detector.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/failure_detector.hh
+++ b/api/failure_detector.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/gossiper.cc
+++ b/api/gossiper.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/gossiper.hh
+++ b/api/gossiper.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/hinted_handoff.cc
+++ b/api/hinted_handoff.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/hinted_handoff.hh
+++ b/api/hinted_handoff.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/lsa.cc
+++ b/api/lsa.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/lsa.hh
+++ b/api/lsa.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/messaging_service.cc
+++ b/api/messaging_service.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/messaging_service.hh
+++ b/api/messaging_service.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/storage_proxy.cc
+++ b/api/storage_proxy.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -33,17 +33,36 @@ namespace sp = httpd::storage_proxy_json;
 using proxy = service::storage_proxy;
 using namespace json;

-static future<json::json_return_type>  sum_estimated_histogram(http_context& ctx, sstables::estimated_histogram proxy::stats::*f) {
-    return ctx.sp.map_reduce0([f](const proxy& p) {return p.get_stats().*f;}, sstables::estimated_histogram(),
-            sstables::merge).then([](const sstables::estimated_histogram& val) {
+static future<utils::rate_moving_average>  sum_timed_rate(distributed<proxy>& d, utils::timed_rate_moving_average proxy::stats::*f) {
+    return d.map_reduce0([f](const proxy& p) {return (p.get_stats().*f).rate();}, utils::rate_moving_average(),
+            std::plus<utils::rate_moving_average>());
+}
+
+static future<json::json_return_type>  sum_timed_rate_as_obj(distributed<proxy>& d, utils::timed_rate_moving_average proxy::stats::*f) {
+    return sum_timed_rate(d, f).then([](const utils::rate_moving_average& val) {
+        httpd::utils_json::rate_moving_average m;
+        m = val;
+        return make_ready_future<json::json_return_type>(m);
+    });
+}
+
+static future<json::json_return_type>  sum_timed_rate_as_long(distributed<proxy>& d, utils::timed_rate_moving_average proxy::stats::*f) {
+    return sum_timed_rate(d, f).then([](const utils::rate_moving_average& val) {
+        return make_ready_future<json::json_return_type>(val.count);
+    });
+}
+
+static future<json::json_return_type>  sum_estimated_histogram(http_context& ctx, utils::estimated_histogram proxy::stats::*f) {
+    return ctx.sp.map_reduce0([f](const proxy& p) {return p.get_stats().*f;}, utils::estimated_histogram(),
+            utils::estimated_histogram_merge).then([](const utils::estimated_histogram& val) {
        utils_json::estimated_histogram res;
        res = val;
        return make_ready_future<json::json_return_type>(res);
    });
 }

-static future<json::json_return_type>  total_latency(http_context& ctx, utils::ihistogram proxy::stats::*f) {
-    return ctx.sp.map_reduce0([f](const proxy& p) {return (p.get_stats().*f).mean * (p.get_stats().*f).count;}, 0.0,
+static future<json::json_return_type>  total_latency(http_context& ctx, utils::timed_rate_moving_average_and_histogram proxy::stats::*f) {
+    return ctx.sp.map_reduce0([f](const proxy& p) {return (p.get_stats().*f).hist.mean * (p.get_stats().*f).hist.count;}, 0.0,
            std::plus<double>()).then([](double val) {
        int64_t res = val;
        return make_ready_future<json::json_return_type>(res);
@@ -291,41 +310,77 @@ void set_storage_proxy(http_context& ctx, routes& r) {
    });

    sp::get_read_metrics_timeouts.set(r, [&ctx](std::unique_ptr<request> req) {
-        return sum_stats(ctx.sp, &proxy::stats::read_timeouts);
+        return sum_timed_rate_as_long(ctx.sp, &proxy::stats::read_timeouts);
    });

    sp::get_read_metrics_unavailables.set(r, [&ctx](std::unique_ptr<request> req) {
-        return sum_stats(ctx.sp, &proxy::stats::read_unavailables);
+        return sum_timed_rate_as_long(ctx.sp, &proxy::stats::read_unavailables);
    });

    sp::get_range_metrics_timeouts.set(r, [&ctx](std::unique_ptr<request> req) {
-        return sum_stats(ctx.sp, &proxy::stats::range_slice_timeouts);
+        return sum_timed_rate_as_long(ctx.sp, &proxy::stats::range_slice_timeouts);
    });

    sp::get_range_metrics_unavailables.set(r, [&ctx](std::unique_ptr<request> req) {
-        return sum_stats(ctx.sp, &proxy::stats::range_slice_unavailables);
+        return sum_timed_rate_as_long(ctx.sp, &proxy::stats::range_slice_unavailables);
    });

    sp::get_write_metrics_timeouts.set(r, [&ctx](std::unique_ptr<request> req) {
-        return sum_stats(ctx.sp, &proxy::stats::write_timeouts);
+        return sum_timed_rate_as_long(ctx.sp, &proxy::stats::write_timeouts);
    });

    sp::get_write_metrics_unavailables.set(r, [&ctx](std::unique_ptr<request> req) {
-        return sum_stats(ctx.sp, &proxy::stats::write_unavailables);
+        return sum_timed_rate_as_long(ctx.sp, &proxy::stats::write_unavailables);
    });

-    sp::get_range_metrics_latency_histogram.set(r, [&ctx](std::unique_ptr<request> req) {
+    sp::get_read_metrics_timeouts_rates.set(r, [&ctx](std::unique_ptr<request> req) {
+        return sum_timed_rate_as_obj(ctx.sp, &proxy::stats::read_timeouts);
+    });
+
+    sp::get_read_metrics_unavailables_rates.set(r, [&ctx](std::unique_ptr<request> req) {
+        return sum_timed_rate_as_obj(ctx.sp, &proxy::stats::read_unavailables);
+    });
+
+    sp::get_range_metrics_timeouts_rates.set(r, [&ctx](std::unique_ptr<request> req) {
+        return sum_timed_rate_as_obj(ctx.sp, &proxy::stats::range_slice_timeouts);
+    });
+
+    sp::get_range_metrics_unavailables_rates.set(r, [&ctx](std::unique_ptr<request> req) {
+        return sum_timed_rate_as_obj(ctx.sp, &proxy::stats::range_slice_unavailables);
+    });
+
+    sp::get_write_metrics_timeouts_rates.set(r, [&ctx](std::unique_ptr<request> req) {
+        return sum_timed_rate_as_obj(ctx.sp, &proxy::stats::write_timeouts);
+    });
+
+    sp::get_write_metrics_unavailables_rates.set(r, [&ctx](std::unique_ptr<request> req) {
+        return sum_timed_rate_as_obj(ctx.sp, &proxy::stats::write_unavailables);
+    });
+
+    sp::get_range_metrics_latency_histogram_depricated.set(r, [&ctx](std::unique_ptr<request> req) {
        return sum_histogram_stats(ctx.sp, &proxy::stats::range);
    });

-    sp::get_write_metrics_latency_histogram.set(r, [&ctx](std::unique_ptr<request> req) {
+    sp::get_write_metrics_latency_histogram_depricated.set(r, [&ctx](std::unique_ptr<request> req) {
        return sum_histogram_stats(ctx.sp, &proxy::stats::write);
    });

-    sp::get_read_metrics_latency_histogram.set(r, [&ctx](std::unique_ptr<request> req) {
+    sp::get_read_metrics_latency_histogram_depricated.set(r, [&ctx](std::unique_ptr<request> req) {
        return sum_histogram_stats(ctx.sp, &proxy::stats::read);
    });

+    sp::get_range_metrics_latency_histogram.set(r, [&ctx](std::unique_ptr<request> req) {
+        return sum_timer_stats(ctx.sp, &proxy::stats::range);
+    });
+
+    sp::get_write_metrics_latency_histogram.set(r, [&ctx](std::unique_ptr<request> req) {
+        return sum_timer_stats(ctx.sp, &proxy::stats::write);
+    });
+
+    sp::get_read_metrics_latency_histogram.set(r, [&ctx](std::unique_ptr<request> req) {
+        return sum_timer_stats(ctx.sp, &proxy::stats::read);
+    });
+
    sp::get_read_estimated_histogram.set(r, [&ctx](std::unique_ptr<request> req) {
        return sum_estimated_histogram(ctx, &proxy::stats::estimated_read);
    });
@@ -342,7 +397,8 @@ void set_storage_proxy(http_context& ctx, routes& r) {
    });

    sp::get_range_estimated_histogram.set(r, [&ctx](std::unique_ptr<request> req) {
-        return sum_histogram_stats(ctx.sp, &proxy::stats::read);
+        // This is the range endpoint, so report proxy::stats::range rather than the read stats.
+        return sum_timer_stats(ctx.sp, &proxy::stats::range);
    });

    sp::get_range_latency.set(r, [&ctx](std::unique_ptr<request> req) {
--- a/api/storage_proxy.hh
+++ b/api/storage_proxy.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/storage_service.cc
+++ b/api/storage_service.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -31,6 +31,7 @@
 #include "locator/snitch_base.hh"
 #include "column_family.hh"
 #include "log.hh"
+#include "release.hh"

 namespace api {

@@ -121,6 +122,9 @@ void set_storage_service(http_context& ctx, routes& r) {
        return service::get_local_storage_service().get_release_version();
    });

+    ss::get_scylla_release_version.set(r, [](const_req req) {
+        return scylla_version();
+    });
    ss::get_schema_version.set(r, [](const_req req) {
        return service::get_local_storage_service().get_schema_version();
    });
@@ -382,21 +386,21 @@ void set_storage_service(http_context& ctx, routes& r) {

    ss::remove_node.set(r, [](std::unique_ptr<request> req) {
        auto host_id = req->get_query_param("host_id");
-        return service::get_local_storage_service().remove_node(host_id).then([] {
+        return service::get_local_storage_service().removenode(host_id).then([] {
            return make_ready_future<json::json_return_type>(json_void());
        });
    });

    ss::get_removal_status.set(r, [](std::unique_ptr<request> req) {
-        //TBD
-        unimplemented();
-        return make_ready_future<json::json_return_type>("");
+        return service::get_local_storage_service().get_removal_status().then([] (auto status) {
+            return make_ready_future<json::json_return_type>(status);
+        });
    });

    ss::force_remove_completion.set(r, [](std::unique_ptr<request> req) {
-        //TBD
-        unimplemented();
-        return make_ready_future<json::json_return_type>(json_void());
+        return service::get_local_storage_service().force_remove_completion().then([] {
+            return make_ready_future<json::json_return_type>(json_void());
+        });
    });

    ss::set_logging_level.set(r, [](std::unique_ptr<request> req) {
@@ -659,16 +663,71 @@ void set_storage_service(http_context& ctx, routes& r) {
    });

    ss::set_trace_probability.set(r, [](std::unique_ptr<request> req) {
-        //TBD
-        unimplemented();
        auto probability = req->get_query_param("probability");
-        return make_ready_future<json::json_return_type>(json_void());
+        try {
+            double real_prob = std::stod(probability.c_str());
+            return tracing::tracing::tracing_instance().invoke_on_all([real_prob] (auto& local_tracing) {
+                local_tracing.set_trace_probability(real_prob);
+            }).then([] {
+                return make_ready_future<json::json_return_type>(json_void());
+            });
+        } catch (...) {
+            throw httpd::bad_param_exception(sprint("Bad format of a probability value: \"%s\"", probability.c_str()));
+        }
+
    });

    ss::get_trace_probability.set(r, [](std::unique_ptr<request> req) {
-        //TBD
-        unimplemented();
-        return make_ready_future<json::json_return_type>(0);
+        return make_ready_future<json::json_return_type>(tracing::tracing::get_local_tracing_instance().get_trace_probability());
+    });
+
+    ss::get_slow_query_info.set(r, [](const_req req) {
+        ss::slow_query_info res;
+        res.enable = tracing::tracing::get_local_tracing_instance().slow_query_tracing_enabled();
+        res.ttl = tracing::tracing::get_local_tracing_instance().slow_query_record_ttl().count() ;
+        res.threshold = tracing::tracing::get_local_tracing_instance().slow_query_threshold().count();
+        return res;
+    });
+
+    // Updates the slow-query tracing settings; a parameter passed as an empty string is left unchanged.
+    ss::set_slow_query.set(r, [](std::unique_ptr<request> req) {
+        auto enable = req->get_query_param("enable");
+        auto ttl = req->get_query_param("ttl");
+        auto threshold = req->get_query_param("threshold");
+        const bool has_enable = enable != "";
+        const bool has_ttl = ttl != "";
+        const bool has_threshold = threshold != "";
+        long ttl_sec = 0;
+        long threshold_us = 0;
+        // Parse the numbers here, before fanning out with invoke_on_all():
+        // parsing inside the per-instance callback would apply the threshold
+        // before a bad ttl is detected, and (per Seastar's futurized calls) the
+        // failure would surface through the returned future instead of reaching
+        // the catch below, so it would never become a bad_param_exception.
+        try {
+            if (has_threshold) {
+                threshold_us = std::stol(threshold.c_str());
+            }
+            if (has_ttl) {
+                ttl_sec = std::stol(ttl.c_str());
+            }
+        } catch (...) {
+            throw httpd::bad_param_exception(sprint("Bad format value: threshold=\"%s\", ttl=\"%s\"", threshold.c_str(), ttl.c_str()));
+        }
+        const bool enabled = strcasecmp(enable.c_str(), "true") == 0;
+        return tracing::tracing::tracing_instance().invoke_on_all([has_threshold, has_ttl, has_enable, threshold_us, ttl_sec, enabled] (auto& local_tracing) {
+            if (has_threshold) {
+                local_tracing.set_slow_query_threshold(std::chrono::microseconds(threshold_us));
+            }
+            if (has_ttl) {
+                local_tracing.set_slow_query_record_ttl(std::chrono::seconds(ttl_sec));
+            }
+            if (has_enable) {
+                local_tracing.set_slow_query_enabled(enabled);
+            }
+        }).then([] {
+            return make_ready_future<json::json_return_type>(json_void());
+        });
    });

    ss::enable_auto_compaction.set(r, [&ctx](std::unique_ptr<request> req) {
--- a/api/storage_service.hh
+++ b/api/storage_service.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/stream_manager.cc
+++ b/api/stream_manager.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/stream_manager.hh
+++ b/api/stream_manager.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/system.cc
+++ b/api/system.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/api/system.hh
+++ b/api/system.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/atomic_cell.hh
+++ b/atomic_cell.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 2015 Cloudius Systems, Ltd.
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -54,9 +54,9 @@ class atomic_cell_or_collection;
 */
 class atomic_cell_type final {
 private:
-    static constexpr int8_t DEAD_FLAGS = 0;
    static constexpr int8_t LIVE_FLAG = 0x01;
    static constexpr int8_t EXPIRY_FLAG = 0x02; // When present, expiry field is present. Set only for live cells
+    static constexpr int8_t REVERT_FLAG = 0x04; // transient flag used to efficiently implement ReversiblyMergeable for atomic cells.
    static constexpr unsigned flags_size = 1;
    static constexpr unsigned timestamp_offset = flags_size;
    static constexpr unsigned timestamp_size = 8;
@@ -67,14 +67,21 @@ private:
    static constexpr unsigned ttl_offset = expiry_offset + expiry_size;
    static constexpr unsigned ttl_size = 4;
 private:
+    static bool is_revert_set(bytes_view cell) {
+        return cell[0] & REVERT_FLAG;
+    }
+    template<typename BytesContainer>
+    static void set_revert(BytesContainer& cell, bool revert) {
+        cell[0] = (cell[0] & ~REVERT_FLAG) | (revert * REVERT_FLAG);
+    }
    static bool is_live(const bytes_view& cell) {
-        return cell[0] != DEAD_FLAGS;
+        return cell[0] & LIVE_FLAG;
    }
    static bool is_live_and_has_ttl(const bytes_view& cell) {
        return cell[0] & EXPIRY_FLAG;
    }
    static bool is_dead(const bytes_view& cell) {
-        return cell[0] == DEAD_FLAGS;
+        return !is_live(cell);
    }
    // Can be called on live and dead cells
    static api::timestamp_type timestamp(const bytes_view& cell) {
@@ -106,7 +113,7 @@ private:
    }
    static managed_bytes make_dead(api::timestamp_type timestamp, gc_clock::time_point deletion_time) {
        managed_bytes b(managed_bytes::initialized_later(), flags_size + timestamp_size + deletion_time_size);
-        b[0] = DEAD_FLAGS;
+        b[0] = 0;
        set_field(b, timestamp_offset, timestamp);
        set_field(b, deletion_time_offset, deletion_time.time_since_epoch().count());
        return b;
@@ -140,8 +147,11 @@ protected:
    ByteContainer _data;
 protected:
    atomic_cell_base(ByteContainer&& data) : _data(std::forward<ByteContainer>(data)) { }
-    atomic_cell_base(const ByteContainer& data) : _data(data) { }
+    friend class atomic_cell_or_collection;
 public:
+    bool is_revert_set() const {
+        return atomic_cell_type::is_revert_set(_data);
+    }
    bool is_live() const {
        return atomic_cell_type::is_live(_data);
    }
@@ -187,10 +197,13 @@ public:
    bytes_view serialize() const {
        return _data;
    }
+    void set_revert(bool revert) {
+        atomic_cell_type::set_revert(_data, revert);
+    }
 };

 class atomic_cell_view final : public atomic_cell_base<bytes_view> {
-    atomic_cell_view(bytes_view data) : atomic_cell_base(data) {}
+    atomic_cell_view(bytes_view data) : atomic_cell_base(std::move(data)) {}
 public:
    static atomic_cell_view from_bytes(bytes_view data) { return atomic_cell_view(data); }

@@ -198,6 +211,11 @@ public:
    friend std::ostream& operator<<(std::ostream& os, const atomic_cell_view& acv);
 };

+class atomic_cell_ref final : public atomic_cell_base<managed_bytes&> {
+public:
+    atomic_cell_ref(managed_bytes& buf) : atomic_cell_base(buf) {}
+};
+
 class atomic_cell final : public atomic_cell_base<managed_bytes> {
    atomic_cell(managed_bytes b) : atomic_cell_base(std::move(b)) {}
 public:
@@ -218,11 +236,19 @@ public:
    static atomic_cell make_live(api::timestamp_type timestamp, bytes_view value) {
        return atomic_cell_type::make_live(timestamp, value);
    }
+    static atomic_cell make_live(api::timestamp_type timestamp, const bytes& value) {
+        return make_live(timestamp, bytes_view(value));
+    }
    static atomic_cell make_live(api::timestamp_type timestamp, bytes_view value,
        gc_clock::time_point expiry, gc_clock::duration ttl)
    {
        return atomic_cell_type::make_live(timestamp, value, expiry, ttl);
    }
+    static atomic_cell make_live(api::timestamp_type timestamp, const bytes& value,
+                                 gc_clock::time_point expiry, gc_clock::duration ttl)
+    {
+        return make_live(timestamp, bytes_view(value), expiry, ttl);
+    }
    static atomic_cell make_live(api::timestamp_type timestamp, bytes_view value, ttl_opt ttl) {
        if (!ttl) {
            return atomic_cell_type::make_live(timestamp, value);
--- a/atomic_cell_hash.hh
+++ b/atomic_cell_hash.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 2015 Cloudius Systems, Ltd.
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -57,3 +57,19 @@ struct appending_hash<atomic_cell_view> {
        }
    }
 };
+
+template<>
+struct appending_hash<atomic_cell> {
+    template<typename Hasher>
+    void operator()(Hasher& h, const atomic_cell& cell) const {
+        feed_hash(h, static_cast<atomic_cell_view>(cell));
+    }
+};
+
+template<>
+struct appending_hash<collection_mutation> {
+    template<typename Hasher>
+    void operator()(Hasher& h, const collection_mutation& cm) const {
+        feed_hash(h, static_cast<collection_mutation_view>(cm));
+    }
+};
--- a/atomic_cell_or_collection.hh
+++ b/atomic_cell_or_collection.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 2015 Cloudius Systems, Ltd.
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -27,6 +27,8 @@

 // A variant type that can hold either an atomic_cell, or a serialized collection.
 // Which type is stored is determined by the schema.
+// Has an "empty" state.
+// Objects moved-from are left in an empty state.
 class atomic_cell_or_collection final {
    managed_bytes _data;
 private:
@@ -36,6 +38,7 @@ public:
    atomic_cell_or_collection(atomic_cell ac) : _data(std::move(ac._data)) {}
    static atomic_cell_or_collection from_atomic_cell(atomic_cell data) { return { std::move(data._data) }; }
    atomic_cell_view as_atomic_cell() const { return atomic_cell_view::from_bytes(_data); }
+    atomic_cell_ref as_atomic_cell_ref() { return { _data }; }
    atomic_cell_or_collection(collection_mutation cm) : _data(std::move(cm.data)) {}
    explicit operator bool() const {
        return !_data.empty();
@@ -60,5 +63,8 @@ public:
            ::feed_hash(as_collection_mutation(), h, def.type);
        }
    }
+    size_t memory_usage() const {
+        return _data.memory_usage();
+    }
    friend std::ostream& operator<<(std::ostream&, const atomic_cell_or_collection&);
 };
--- a/auth/auth.cc
+++ b/auth/auth.cc
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2016 Cloudius Systems
+ * Copyright (C) 2016 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -40,14 +40,19 @@
 */
 #include <seastar/core/sleep.hh>

+#include <seastar/core/distributed.hh>
+
 #include "auth.hh"
 #include "authenticator.hh"
+#include "authorizer.hh"
 #include "database.hh"
 #include "cql3/query_processor.hh"
-#include "cql3/statements/cf_statement.hh"
+#include "cql3/statements/raw/cf_statement.hh"
 #include "cql3/statements/create_table_statement.hh"
 #include "db/config.hh"
 #include "service/migration_manager.hh"
+#include "utils/loading_cache.hh"
+#include "utils/hash.hh"

 const sstring auth::auth::DEFAULT_SUPERUSER_NAME("cassandra");
 const sstring auth::auth::AUTH_KS("system_auth");
@@ -76,13 +81,10 @@ class auth_migration_listener : public service::migration_listener {
    void on_update_aggregate(const sstring& ks_name, const sstring& aggregate_name) override {}

    void on_drop_keyspace(const sstring& ks_name) override {
-        // TODO:
-        //DatabaseDescriptor.getAuthorizer().revokeAll(DataResource.keyspace(ksName));
-
+        auth::authorizer::get().revoke_all(auth::data_resource(ks_name));
    }
    void on_drop_column_family(const sstring& ks_name, const sstring& cf_name) override {
-        // TODO:
-        //DatabaseDescriptor.getAuthorizer().revokeAll(DataResource.columnFamily(ksName, cfName));
+        auth::authorizer::get().revoke_all(auth::data_resource(ks_name, cf_name));
    }
    void on_drop_user_type(const sstring& ks_name, const sstring& type_name) override {}
    void on_drop_function(const sstring& ks_name, const sstring& function_name) override {}
@@ -91,6 +93,64 @@ class auth_migration_listener : public service::migration_listener {

 static auth_migration_listener auth_migration;

+namespace std {
+template <>
+struct hash<auth::data_resource> {
+    size_t operator()(const auth::data_resource & v) const {
+        return v.hash_value();
+    }
+};
+
+template <>
+struct hash<auth::authenticated_user> {
+    size_t operator()(const auth::authenticated_user & v) const {
+        return utils::tuple_hash()(v.name(), v.is_anonymous());
+    }
+};
+}
+
+class auth::auth::permissions_cache {
+public:
+    typedef utils::loading_cache<std::pair<authenticated_user, data_resource>, permission_set, utils::tuple_hash> cache_type;
+    typedef typename cache_type::key_type key_type;
+
+    permissions_cache()
+                    : permissions_cache(
+                                    cql3::get_local_query_processor().db().local().get_config()) {
+    }
+
+    permissions_cache(const db::config& cfg)
+                    : _cache(cfg.permissions_cache_max_entries(), expiry(cfg),
+                                    std::chrono::milliseconds(
+                                                    cfg.permissions_validity_in_ms()),
+                                    [](const key_type& k) {
+                                        logger.debug("Refreshing permissions for {}", k.first.name());
+                                        return authorizer::get().authorize(::make_shared<authenticated_user>(k.first), k.second);
+                                    }) {
+    }
+
+    static std::chrono::milliseconds expiry(const db::config& cfg) {
+        auto exp = cfg.permissions_update_interval_in_ms();
+        if (exp == 0 || exp == std::numeric_limits<uint32_t>::max()) {
+            exp = cfg.permissions_validity_in_ms();
+        }
+        return std::chrono::milliseconds(exp);
+    }
+
+    future<> stop() {
+        return make_ready_future<>();
+    }
+
+    future<permission_set> get(::shared_ptr<authenticated_user> user, data_resource resource) {
+        return _cache.get(key_type(*user, std::move(resource)));
+    }
+
+private:
+    cache_type _cache;
+};
+
+static distributed<auth::auth::permissions_cache> perm_cache;
+
 /**
 * Poor mans job schedule. For maximum 2 jobs. Sic.
 * Still does nothing more clever than waiting 10 seconds
@@ -163,14 +223,22 @@ bool auth::auth::is_class_type(const sstring& type, const sstring& classname) {
 future<> auth::auth::setup() {
    auto& db = cql3::get_local_query_processor().db().local();
    auto& cfg = db.get_config();
-    auto type = cfg.authenticator();

-    if (is_class_type(type, authenticator::ALLOW_ALL_AUTHENTICATOR_NAME)) {
-        return authenticator::setup(type).discard_result(); // just create the object
+    future<> f = perm_cache.start();
+
+    if (is_class_type(cfg.authenticator(),
+                    authenticator::ALLOW_ALL_AUTHENTICATOR_NAME)
+                    && is_class_type(cfg.authorizer(),
+                                    authorizer::ALLOW_ALL_AUTHORIZER_NAME)
+                                    ) {
+        // just create the objects
+        return f.then([&cfg] {
+            return authenticator::setup(cfg.authenticator());
+        }).then([&cfg] {
+            return authorizer::setup(cfg.authorizer());
+        });
    }

-    future<> f = make_ready_future();
-
    if (!db.has_keyspace(AUTH_KS)) {
        std::map<sstring, sstring> opts;
        opts["replication_factor"] = "1";
@@ -182,10 +250,10 @@ future<> auth::auth::setup() {
        return setup_table(USERS_CF, sprint("CREATE TABLE %s.%s (%s text, %s boolean, PRIMARY KEY(%s)) WITH gc_grace_seconds=%d",
                                        AUTH_KS, USERS_CF, USER_NAME, SUPER, USER_NAME,
                                        90 * 24 * 60 * 60)); // 3 months.
-    }).then([type] {
-        return authenticator::setup(type).discard_result();
-    }).then([] {
-        // TODO authorizer
+    }).then([&cfg] {
+        return authenticator::setup(cfg.authenticator());
+    }).then([&cfg] {
+        return authorizer::setup(cfg.authorizer());
    }).then([] {
        service::get_local_migration_manager().register_listener(&auth_migration); // again, only one shard...
        // instead of once-timer, just schedule this later
@@ -216,9 +284,15 @@ future<> auth::auth::shutdown() {
    // db-env-shutdown != process shutdown
    return smp::invoke_on_all([] {
        thread_waiters().clear();
+    }).then([] {
+        return perm_cache.stop();
    });
 }

+future<auth::permission_set> auth::auth::get_permissions(::shared_ptr<authenticated_user> user, data_resource resource) {
+    return perm_cache.local().get(std::move(user), std::move(resource));
+}
+
 static db::consistency_level consistency_for_user(const sstring& username) {
    if (username == auth::auth::DEFAULT_SUPERUSER_NAME) {
        return db::consistency_level::QUORUM;
@@ -274,15 +348,18 @@ future<> auth::auth::setup_table(const sstring& name, const sstring& cql) {
        return make_ready_future();
    }

-    ::shared_ptr<cql3::statements::cf_statement> parsed = static_pointer_cast<
-                    cql3::statements::cf_statement>(cql3::query_processor::parse_statement(cql));
+    ::shared_ptr<cql3::statements::raw::cf_statement> parsed = static_pointer_cast<
+                    cql3::statements::raw::cf_statement>(cql3::query_processor::parse_statement(cql));
    parsed->prepare_keyspace(AUTH_KS);
    ::shared_ptr<cql3::statements::create_table_statement> statement =
                    static_pointer_cast<cql3::statements::create_table_statement>(
                                    parsed->prepare(db)->statement);
-    // Origin sets "Legacy Cf Id" for the new table. We have no need to be
-    // pre-2.1 compatible (afaik), so lets skip a whole lotta hoolaballo
-    return statement->announce_migration(qp.proxy(), false).then([statement](bool) {});
+    auto schema = statement->get_cf_meta_data();
+    auto uuid = generate_legacy_id(schema->ks_name(), schema->cf_name());
+
+    schema_builder b(schema);
+    b.set_uuid(uuid);
+    return service::get_local_migration_manager().announce_new_column_family(b.build(), false);
 }

 future<bool> auth::auth::has_existing_users(const sstring& cfname, const sstring& def_user_name, const sstring& name_column) {
--- a/auth/auth.hh
+++ b/auth/auth.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2016 Cloudius Systems
+ * Copyright (C) 2016 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -44,13 +44,21 @@
 #include <chrono>
 #include <seastar/core/sstring.hh>
 #include <seastar/core/future.hh>
+#include <seastar/core/shared_ptr.hh>
+

 #include "exceptions/exceptions.hh"
+#include "permission.hh"
+#include "data_resource.hh"

 namespace auth {

+class authenticated_user;
+
 class auth {
 public:
+    class permissions_cache;
+
    static const sstring DEFAULT_SUPERUSER_NAME;
    static const sstring AUTH_KS;
    static const sstring USERS_CF;
@@ -58,12 +66,7 @@ public:

    static bool is_class_type(const sstring& type, const sstring& classname);

-#if 0
-    public static Set<Permission> getPermissions(AuthenticatedUser user, IResource resource)
-    {
-        return permissionsCache.getPermissions(user, resource);
-    }
-#endif
+    static future<permission_set> get_permissions(::shared_ptr<authenticated_user>, data_resource);

    /**
     * Checks if the username is stored in AUTH_KS.USERS_CF.
--- a/auth/authenticated_user.cc
+++ b/auth/authenticated_user.cc
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2016 Cloudius Systems
+ * Copyright (C) 2016 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -41,6 +41,7 @@


 #include "authenticated_user.hh"
+#include "auth.hh"

 const sstring auth::authenticated_user::ANONYMOUS_USERNAME("anonymous");

@@ -52,10 +53,20 @@ auth::authenticated_user::authenticated_user(sstring name)
                : _name(name), _anon(false)
 {}

+auth::authenticated_user::authenticated_user(authenticated_user&&) = default;
+auth::authenticated_user::authenticated_user(const authenticated_user&) = default;
+
 const sstring& auth::authenticated_user::name() const {
    return _anon ? ANONYMOUS_USERNAME : _name;
 }

+future<bool> auth::authenticated_user::is_super() const {
+    if (is_anonymous()) {
+        return make_ready_future<bool>(false);
+    }
+    return auth::auth::is_super_user(_name);
+}
+
 bool auth::authenticated_user::operator==(const authenticated_user& v) const {
    return _anon ? v._anon : _name == v._name;
 }
--- a/auth/authenticated_user.hh
+++ b/auth/authenticated_user.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2016 Cloudius Systems
+ * Copyright (C) 2016 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -42,6 +42,7 @@
 #pragma once

 #include <seastar/core/sstring.hh>
+#include <seastar/core/future.hh>

 namespace auth {

@@ -51,6 +52,8 @@ public:

    authenticated_user();
    authenticated_user(sstring name);
+    authenticated_user(authenticated_user&&);
+    authenticated_user(const authenticated_user&);

    const sstring& name() const;

@@ -60,7 +63,7 @@ public:
     * Im most cased, though not necessarily, a superuser will have Permission.ALL on every resource
     * (depends on IAuthorizer implementation).
     */
-    bool is_super() const;
+    future<bool> is_super() const;

    /**
     * If IAuthenticator doesn't require authentication, this method may return true.
--- a/auth/authenticator.cc
+++ b/auth/authenticator.cc
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2016 Cloudius Systems
+ * Copyright (C) 2016 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -49,6 +49,22 @@ const sstring auth::authenticator::USERNAME_KEY("username");
 const sstring auth::authenticator::PASSWORD_KEY("password");
 const sstring auth::authenticator::ALLOW_ALL_AUTHENTICATOR_NAME("org.apache.cassandra.auth.AllowAllAuthenticator");

+auth::authenticator::option auth::authenticator::string_to_option(const sstring& name) {
+    if (strcasecmp(name.c_str(), "password") == 0) {
+        return option::PASSWORD;
+    }
+    throw std::invalid_argument(name);
+}
+
+sstring auth::authenticator::option_to_string(option opt) { // inverse of string_to_option(); throws std::invalid_argument on unknown values
+    switch (opt) {
+    case option::PASSWORD:
+        return "PASSWORD";
+    default: // sprint() is printf-style; print the raw value, since streaming `opt` would call back into this function
+        throw std::invalid_argument(sprint("Unknown option %d", static_cast<int>(opt)));
+    }
+}
+
 /**
 * Authenticator is assumed to be a fully state-less immutable object (note all the const).
 * We thus store a single instance globally, since it should be safe/ok.
@@ -84,8 +100,9 @@ auth::authenticator::setup(const sstring& type) throw (exceptions::configuration
            future<> drop(sstring username) throw(exceptions::request_validation_exception, exceptions::request_execution_exception) override {
                return make_ready_future();
            }
-            resource_ids protected_resources() const override {
-                return resource_ids();
+            const resource_ids& protected_resources() const override {
+                static const resource_ids ids;
+                return ids;
            }
            ::shared_ptr<sasl_challenge> new_sasl_challenge() const override {
                throw std::runtime_error("Should not reach");
--- a/auth/authenticator.hh
+++ b/auth/authenticator.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2016 Cloudius Systems
+ * Copyright (C) 2016 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -79,15 +79,13 @@ public:
        PASSWORD
    };

+    static option string_to_option(const sstring&);
+    static sstring option_to_string(option);
+
    using option_set = enum_set<super_enum<option, option::PASSWORD>>;
    using option_map = std::unordered_map<option, boost::any, enum_hash<option>>;
    using credentials_map = std::unordered_map<sstring, sstring>;

-    /**
-     * Resource id mappings, i.e. keyspace and/or column families.
-     */
-    using resource_ids = std::set<data_resource>;
-
    /**
     * Setup is called once upon system startup to initialize the IAuthenticator.
     *
@@ -174,7 +172,7 @@ public:
     * @return Keyspaces, column families that will be unmodifiable by users; other resources.
     * @see resource_ids
     */
-    virtual resource_ids protected_resources() const = 0;
+    virtual const resource_ids& protected_resources() const = 0;

    class sasl_challenge {
    public:
@@ -194,5 +192,9 @@ public:
    virtual ::shared_ptr<sasl_challenge> new_sasl_challenge() const = 0;
 };

+inline std::ostream& operator<<(std::ostream& os, authenticator::option opt) {
+    return os << authenticator::option_to_string(opt);
+}
+
 }

--- a/auth/authorizer.cc
+++ b/auth/authorizer.cc
@@ -0,0 +1,104 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/*
+ * Copyright (C) 2016 ScyllaDB
+ *
+ * Modified by ScyllaDB
+ */
+
+/*
+ * This file is part of Scylla.
+ *
+ * Scylla is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU Affero General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * Scylla is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with Scylla.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#include "authorizer.hh"
+#include "authenticated_user.hh"
+#include "default_authorizer.hh"
+#include "auth.hh"
+#include "db/config.hh"
+
+const sstring auth::authorizer::ALLOW_ALL_AUTHORIZER_NAME("org.apache.cassandra.auth.AllowAllAuthorizer");
+
+/**
+ * Authorizer is assumed to be a fully state-less immutable object (note all the const).
+ * We thus store a single instance globally, since it should be safe/ok.
+ */
+static std::unique_ptr<auth::authorizer> global_authorizer;
+
+future<>
+auth::authorizer::setup(const sstring& type) {
+    if (auth::auth::is_class_type(type, ALLOW_ALL_AUTHORIZER_NAME)) {
+        class allow_all_authorizer : public authorizer {
+        public:
+            future<permission_set> authorize(::shared_ptr<authenticated_user>, data_resource) const override {
+                return make_ready_future<permission_set>(permissions::ALL);
+            }
+            future<> grant(::shared_ptr<authenticated_user>, permission_set, data_resource, sstring) override {
+                throw exceptions::invalid_request_exception("GRANT operation is not supported by AllowAllAuthorizer");
+            }
+            future<> revoke(::shared_ptr<authenticated_user>, permission_set, data_resource, sstring) override {
+                throw exceptions::invalid_request_exception("REVOKE operation is not supported by AllowAllAuthorizer");
+            }
+            future<std::vector<permission_details>> list(::shared_ptr<authenticated_user> performer, permission_set, optional<data_resource>, optional<sstring>) const override {
+                throw exceptions::invalid_request_exception("LIST PERMISSIONS operation is not supported by AllowAllAuthorizer");
+            }
+            future<> revoke_all(sstring dropped_user) override {
+                return make_ready_future();
+            }
+            future<> revoke_all(data_resource) override {
+                return make_ready_future();
+            }
+            const resource_ids& protected_resources() override {
+                static const resource_ids ids;
+                return ids;
+            }
+            future<> validate_configuration() const override {
+                return make_ready_future();
+            }
+        };
+
+        global_authorizer = std::make_unique<allow_all_authorizer>();
+    } else if (auth::auth::is_class_type(type, default_authorizer::DEFAULT_AUTHORIZER_NAME)) {
+        auto da = std::make_unique<default_authorizer>();
+        auto f = da->init();
+        return f.then([da = std::move(da)]() mutable {
+            global_authorizer = std::move(da);
+        });
+    } else {
+        throw exceptions::configuration_exception("Invalid authorizer type: " + type);
+    }
+    return make_ready_future();
+}
+
+auth::authorizer& auth::authorizer::get() {
+    assert(global_authorizer);
+    return *global_authorizer;
+}
--- a/auth/authorizer.hh
+++ b/auth/authorizer.hh
@@ -0,0 +1,171 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/*
+ * Copyright (C) 2016 ScyllaDB
+ *
+ * Modified by ScyllaDB
+ */
+
+/*
+ * This file is part of Scylla.
+ *
+ * Scylla is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU Affero General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * Scylla is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with Scylla.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#pragma once
+
+#include <vector>
+#include <tuple>
+
+#include <experimental/optional>
+#include <seastar/core/future.hh>
+#include <seastar/core/shared_ptr.hh>
+
+#include "permission.hh"
+#include "data_resource.hh"
+
+namespace auth {
+
+class authenticated_user;
+
+struct permission_details {
+    sstring user;
+    data_resource resource;
+    permission_set permissions;
+
+    bool operator<(const permission_details& v) const {
+        return std::tie(user, resource, permissions) < std::tie(v.user, v.resource, v.permissions);
+    }
+};
+
+using std::experimental::optional;
+
+class authorizer {
+public:
+    static const sstring ALLOW_ALL_AUTHORIZER_NAME;
+
+    virtual ~authorizer() {}
+
+    /**
+     * The primary Authorizer method. Returns a set of permissions of a user on a resource.
+     *
+     * @param user Authenticated user requesting authorization.
+     * @param resource Resource for which the authorization is being requested. @see DataResource.
+     * @return Set of permissions of the user on the resource. Should never return empty. Use permission.NONE instead.
+     */
+    virtual future<permission_set> authorize(::shared_ptr<authenticated_user>, data_resource) const = 0;
+
+    /**
+     * Grants a set of permissions on a resource to a user.
+     * The opposite of revoke().
+     *
+     * @param performer User who grants the permissions.
+     * @param permissions Set of permissions to grant.
+     * @param to Grantee of the permissions.
+     * @param resource Resource on which to grant the permissions.
+     *
+     * @throws RequestValidationException
+     * @throws RequestExecutionException
+     */
+    virtual future<> grant(::shared_ptr<authenticated_user> performer, permission_set, data_resource, sstring to) = 0;
+
+    /**
+     * Revokes a set of permissions on a resource from a user.
+     * The opposite of grant().
+     *
+     * @param performer User who revokes the permissions.
+     * @param permissions Set of permissions to revoke.
+     * @param from Revokee of the permissions.
+     * @param resource Resource on which to revoke the permissions.
+     *
+     * @throws RequestValidationException
+     * @throws RequestExecutionException
+     */
+    virtual future<> revoke(::shared_ptr<authenticated_user> performer, permission_set, data_resource, sstring from) = 0;
+
+    /**
+     * Returns a list of permissions on a resource of a user.
+     *
+     * @param performer User who wants to see the permissions.
+     * @param permissions Set of Permission values the user is interested in. The result should only include the matching ones.
+     * @param resource The resource on which permissions are requested. Can be null, in which case permissions on all resources
+     *                 should be returned.
+     * @param of The user whose permissions are requested. Can be null, in which case permissions of every user should be returned.
+     *
+     * @return All of the matching permission that the requesting user is authorized to know about.
+     *
+     * @throws RequestValidationException
+     * @throws RequestExecutionException
+     */
+    virtual future<std::vector<permission_details>> list(::shared_ptr<authenticated_user> performer, permission_set, optional<data_resource>, optional<sstring>) const = 0;
+
+    /**
+     * This method is called before deleting a user with DROP USER query so that a new user with the same
+     * name wouldn't inherit permissions of the deleted user in the future.
+     *
+     * @param droppedUser The user to revoke all permissions from.
+     */
+    virtual future<> revoke_all(sstring dropped_user) = 0;
+
+    /**
+     * This method is called after a resource is removed (i.e. keyspace or a table is dropped).
+     *
+     * @param droppedResource The resource to revoke all permissions on.
+     */
+    virtual future<> revoke_all(data_resource) = 0;
+
+    /**
+     * Set of resources that should be made inaccessible to users and only accessible internally.
+     *
+     * @return Keyspaces, column families that will be unmodifiable by users; other resources.
+     */
+    virtual const resource_ids& protected_resources() = 0;
+
+    /**
+     * Validates configuration of IAuthorizer implementation (if configurable).
+     *
+     * @throws ConfigurationException when there is a configuration error.
+     */
+    virtual future<> validate_configuration() const = 0;
+
+    /**
+     * Setup is called once upon system startup to initialize the IAuthorizer.
+     *
+     * For example, use this method to create any required keyspaces/column families.
+     */
+    static future<> setup(const sstring& type);
+
+    /**
+     * Returns the system authorizer. Must have called setup before calling this.
+     */
+    static authorizer& get();
+};
+
+}
--- a/auth/data_resource.cc
+++ b/auth/data_resource.cc
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2016 Cloudius Systems
+ * Copyright (C) 2016 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -47,11 +47,8 @@
 const sstring auth::data_resource::ROOT_NAME("data");

 auth::data_resource::data_resource(level l, const sstring& ks, const sstring& cf)
-    : _ks(ks), _cf(cf)
+    : _level(l), _ks(ks), _cf(cf)
 {
-    if (l != get_level()) {
-        throw std::invalid_argument("level/keyspace/column mismatch");
-    }
 }

 auth::data_resource::data_resource()
@@ -67,14 +64,7 @@ auth::data_resource::data_resource(const sstring& ks, const sstring& cf)
 {}

 auth::data_resource::level auth::data_resource::get_level() const {
-    if (!_cf.empty()) {
-        assert(!_ks.empty());
-        return level::COLUMN_FAMILY;
-    }
-    if (!_ks.empty()) {
-        return level::KEYSPACE;
-    }
-    return level::ROOT;
+    return _level;
 }

 auth::data_resource auth::data_resource::from_name(
@@ -158,7 +148,15 @@ bool auth::data_resource::exists() const {
 }

 sstring auth::data_resource::to_string() const {
-    return name();
+    switch (get_level()) {
+        case level::ROOT:
+            return "<all keyspaces>";
+        case level::KEYSPACE:
+            return sprint("<keyspace %s>", _ks);
+        case level::COLUMN_FAMILY:
+        default:
+            return sprint("<table %s.%s>", _ks, _cf);
+    }
 }

 bool auth::data_resource::operator==(const data_resource& v) const {
@@ -170,6 +168,6 @@ bool auth::data_resource::operator<(const data_resource& v) const {
 }

 std::ostream& auth::operator<<(std::ostream& os, const data_resource& r) {
-    return os << r.name();
+    return os << r.to_string();
 }

--- a/auth/data_resource.hh
+++ b/auth/data_resource.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2016 Cloudius Systems
+ * Copyright (C) 2016 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -41,7 +41,9 @@

 #pragma once

+#include "utils/hash.hh"
 #include <iosfwd>
+#include <set>
 #include <seastar/core/sstring.hh>

 namespace auth {
@@ -54,6 +56,7 @@ private:

    static const sstring ROOT_NAME;

+    level _level;
    sstring _ks;
    sstring _cf;

@@ -136,8 +139,17 @@ public:

    bool operator==(const data_resource&) const;
    bool operator<(const data_resource&) const;
+
+    size_t hash_value() const {
+        return utils::tuple_hash()(_ks, _cf);
+    }
 };

+/**
+ * Resource id mappings, i.e. keyspace and/or column families.
+ */
+using resource_ids = std::set<data_resource>;
+
 std::ostream& operator<<(std::ostream&, const data_resource&);

 }
--- a/auth/default_authorizer.cc
+++ b/auth/default_authorizer.cc
@@ -0,0 +1,240 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/*
+ * Copyright (C) 2016 ScyllaDB
+ *
+ * Modified by ScyllaDB
+ */
+
+/*
+ * This file is part of Scylla.
+ *
+ * Scylla is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU Affero General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * Scylla is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with Scylla.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#include <unistd.h>
+#include <crypt.h>
+#include <random>
+#include <chrono>
+
+#include <seastar/core/reactor.hh>
+
+#include "auth.hh"
+#include "default_authorizer.hh"
+#include "authenticated_user.hh"
+#include "permission.hh"
+#include "cql3/query_processor.hh"
+#include "exceptions/exceptions.hh"
+#include "log.hh"
+
+const sstring auth::default_authorizer::DEFAULT_AUTHORIZER_NAME(
+                "org.apache.cassandra.auth.CassandraAuthorizer");
+
+static const sstring USER_NAME = "username";
+static const sstring RESOURCE_NAME = "resource";
+static const sstring PERMISSIONS_NAME = "permissions";
+static const sstring PERMISSIONS_CF = "permissions";
+
+static logging::logger logger("default_authorizer");
+
+auth::default_authorizer::default_authorizer() {
+}
+auth::default_authorizer::~default_authorizer() {
+}
+
+future<> auth::default_authorizer::init() {
+    sstring create_table = sprint("CREATE TABLE %s.%s ("
+                    "%s text,"
+                    "%s text,"
+                    "%s set<text>,"
+                    "PRIMARY KEY(%s, %s)"
+                    ") WITH gc_grace_seconds=%d", auth::auth::AUTH_KS,
+                    PERMISSIONS_CF, USER_NAME, RESOURCE_NAME, PERMISSIONS_NAME,
+                    USER_NAME, RESOURCE_NAME, 90 * 24 * 60 * 60); // 3 months.
+
+    return auth::setup_table(PERMISSIONS_CF, create_table);
+}
+
+
+future<auth::permission_set> auth::default_authorizer::authorize(
+                ::shared_ptr<authenticated_user> user, data_resource resource) const {
+    return user->is_super().then([this, user, resource = std::move(resource)](bool is_super) {
+        if (is_super) { // superusers get every permission without consulting the permissions table
+            return make_ready_future<permission_set>(permissions::ALL);
+        }
+
+        /**
+         * Otherwise read the permission strings stored for this user/resource pair.
+         * TODO: could create actual data type for permission (translating string<->perm), but we must store strings anyway.
+         */
+        auto& qp = cql3::get_local_query_processor();
+        auto query = sprint("SELECT %s FROM %s.%s WHERE %s = ? AND %s = ?"
+                        , PERMISSIONS_NAME, auth::AUTH_KS, PERMISSIONS_CF, USER_NAME, RESOURCE_NAME);
+        return qp.process(query, db::consistency_level::LOCAL_ONE, {user->name(), resource.name() })
+                        .then_wrapped([=](future<::shared_ptr<cql3::untyped_result_set>> f) {
+            try {
+                auto res = f.get0(); // rethrows here if the query failed
+
+                if (res->empty() || !res->one().has(PERMISSIONS_NAME)) { // no row / no permissions column => nothing granted
+                    return make_ready_future<permission_set>(permissions::NONE);
+                }
+                return make_ready_future<permission_set>(permissions::from_strings(res->one().get_set<sstring>(PERMISSIONS_NAME)));
+            } catch (exceptions::request_execution_exception& e) { // execution failure: report NONE, but log the cause
+                logger.warn("CassandraAuthorizer failed to authorize {} for {}: {}", user->name(), resource, e);
+                return make_ready_future<permission_set>(permissions::NONE);
+            }
+        });
+    });
+}
+
+#include <boost/range.hpp>
+
+future<> auth::default_authorizer::modify(
+                ::shared_ptr<authenticated_user> performer, permission_set set,
+                data_resource resource, sstring user, sstring op) {
+    // TODO: why does this not check super user?
+    auto& qp = cql3::get_local_query_processor();
+    auto query = sprint("UPDATE %s.%s SET %s = %s %s ? WHERE %s = ? AND %s = ?",
+                    auth::AUTH_KS, PERMISSIONS_CF, PERMISSIONS_NAME,
+                    PERMISSIONS_NAME, op, USER_NAME, RESOURCE_NAME);
+    return qp.process(query, db::consistency_level::ONE, {
+                    permissions::to_strings(set), user, resource.name() }).discard_result();
+}
+
+
+future<> auth::default_authorizer::grant(
+                ::shared_ptr<authenticated_user> performer, permission_set set,
+                data_resource resource, sstring to) {
+    return modify(std::move(performer), std::move(set), std::move(resource), std::move(to), "+");
+}
+
+future<> auth::default_authorizer::revoke(
+                ::shared_ptr<authenticated_user> performer, permission_set set,
+                data_resource resource, sstring from) {
+    return modify(std::move(performer), std::move(set), std::move(resource), std::move(from), "-");
+}
+
+future<std::vector<auth::permission_details>> auth::default_authorizer::list(
+                ::shared_ptr<authenticated_user> performer, permission_set set,
+                optional<data_resource> resource, optional<sstring> user) const {
+    return performer->is_super().then([this, performer, set = std::move(set), resource = std::move(resource), user = std::move(user)](bool is_super) {
+        if (!is_super && (!user || performer->name() != *user)) {
+            throw exceptions::unauthorized_exception(sprint("You are not authorized to view %s's permissions", user ? *user : "everyone"));
+        }
+
+        auto query = sprint("SELECT %s, %s, %s FROM %s.%s", USER_NAME, RESOURCE_NAME, PERMISSIONS_NAME, auth::AUTH_KS, PERMISSIONS_CF);
+        auto& qp = cql3::get_local_query_processor();
+
+        // Oh, look, it is a case where it does not pay off to have
+        // parameters to process in an initializer list.
+        future<::shared_ptr<cql3::untyped_result_set>> f = make_ready_future<::shared_ptr<cql3::untyped_result_set>>();
+
+        if (resource && user) {
+            query += sprint(" WHERE %s = ? AND %s = ?", USER_NAME, RESOURCE_NAME);
+            f = qp.process(query, db::consistency_level::ONE, {*user, resource->name()});
+        } else if (resource) {
+            query += sprint(" WHERE %s = ? ALLOW FILTERING", RESOURCE_NAME);
+            f = qp.process(query, db::consistency_level::ONE, {resource->name()});
+        } else if (user) {
+            query += sprint(" WHERE %s = ?", USER_NAME);
+            f = qp.process(query, db::consistency_level::ONE, {*user});
+        } else {
+            f = qp.process(query, db::consistency_level::ONE, {});
+        }
+
+        return f.then([set](::shared_ptr<cql3::untyped_result_set> res) {
+            std::vector<permission_details> result;
+
+            for (auto& row : *res) {
+                if (row.has(PERMISSIONS_NAME)) {
+                    auto username = row.get_as<sstring>(USER_NAME);
+                    auto resource = data_resource::from_name(row.get_as<sstring>(RESOURCE_NAME));
+                    auto ps = permissions::from_strings(row.get_set<sstring>(PERMISSIONS_NAME));
+                    ps = permission_set::from_mask(ps.mask() & set.mask());
+
+                    result.emplace_back(permission_details {username, resource, ps});
+                }
+            }
+            return make_ready_future<std::vector<permission_details>>(std::move(result));
+        });
+    });
+}
+
+future<> auth::default_authorizer::revoke_all(sstring dropped_user) {
+    auto& qp = cql3::get_local_query_processor();
+    auto query = sprint("DELETE FROM %s.%s WHERE %s = ?", auth::AUTH_KS,
+                    PERMISSIONS_CF, USER_NAME);
+    return qp.process(query, db::consistency_level::ONE, { dropped_user }).discard_result().handle_exception(
+                    [dropped_user](auto ep) {
+                        try {
+                            std::rethrow_exception(ep);
+                        } catch (exceptions::request_execution_exception& e) {
+                            logger.warn("CassandraAuthorizer failed to revoke all permissions of {}: {}", dropped_user, e);
+                        }
+                    });
+}
+
+future<> auth::default_authorizer::revoke_all(data_resource resource) {
+    auto& qp = cql3::get_local_query_processor();
+    auto query = sprint("SELECT %s FROM %s.%s WHERE %s = ? ALLOW FILTERING",
+                    USER_NAME, auth::AUTH_KS, PERMISSIONS_CF, RESOURCE_NAME);
+    return qp.process(query, db::consistency_level::LOCAL_ONE, { resource.name() })
+                    .then_wrapped([resource, &qp](future<::shared_ptr<cql3::untyped_result_set>> f) {
+        try {
+            auto res = f.get0();
+            return parallel_for_each(res->begin(), res->end(), [&qp, res, resource](const cql3::untyped_result_set::row& r) {
+                auto query = sprint("DELETE FROM %s.%s WHERE %s = ? AND %s = ?"
+                                , auth::AUTH_KS, PERMISSIONS_CF, USER_NAME, RESOURCE_NAME);
+                return qp.process(query, db::consistency_level::LOCAL_ONE, { r.get_as<sstring>(USER_NAME), resource.name() })
+                                .discard_result().handle_exception([resource](auto ep) {
+                    try {
+                        std::rethrow_exception(ep);
+                    } catch (exceptions::request_execution_exception& e) {
+                        logger.warn("CassandraAuthorizer failed to revoke all permissions on {}: {}", resource, e);
+                    }
+
+                });
+            });
+        } catch (exceptions::request_execution_exception& e) {
+            logger.warn("CassandraAuthorizer failed to revoke all permissions on {}: {}", resource, e);
+            return make_ready_future();
+        }
+    });
+}
+
+
+const auth::resource_ids& auth::default_authorizer::protected_resources() {
+    static const resource_ids ids({ data_resource(auth::AUTH_KS, PERMISSIONS_CF) });
+    return ids;
+}
+
+future<> auth::default_authorizer::validate_configuration() const {
+    return make_ready_future();
+}
--- a/auth/default_authorizer.hh
+++ b/auth/default_authorizer.hh
@@ -0,0 +1,78 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/*
+ * Copyright (C) 2016 ScyllaDB
+ *
+ * Modified by ScyllaDB
+ */
+
+/*
+ * This file is part of Scylla.
+ *
+ * Scylla is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU Affero General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * Scylla is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with Scylla.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#pragma once
+
+#include "authorizer.hh"
+
+namespace auth {
+
+class default_authorizer : public authorizer { // authorizer implementation; the definitions visible in default_authorizer.cc work on the permissions table of the auth keyspace
+public:
+    static const sstring DEFAULT_AUTHORIZER_NAME;
+
+    default_authorizer();
+    ~default_authorizer();
+
+    future<> init();
+
+    future<permission_set> authorize(::shared_ptr<authenticated_user>, data_resource) const override;
+
+    future<> grant(::shared_ptr<authenticated_user>, permission_set, data_resource, sstring) override;
+
+    future<> revoke(::shared_ptr<authenticated_user>, permission_set, data_resource, sstring) override;
+
+    future<std::vector<permission_details>> list(::shared_ptr<authenticated_user>, permission_set, optional<data_resource>, optional<sstring>) const override;
+    // sstring overload: presumably keyed by user name -- TODO confirm against the .cc.
+    future<> revoke_all(sstring) override;
+    // Deletes every stored permission row for the resource; request_execution_exception is logged, not propagated.
+    future<> revoke_all(data_resource) override;
+    // Returns a one-element set: the permissions table of the auth keyspace.
+    const resource_ids& protected_resources() override;
+    // Performs no checks; the returned future is already resolved.
+    future<> validate_configuration() const override;
+
+private:
+    future<> modify(::shared_ptr<authenticated_user>, permission_set, data_resource, sstring, sstring); // NOTE(review): presumably the shared helper behind grant()/revoke() -- confirm in the .cc
+};
+
+} /* namespace auth */
+
--- a/auth/password_authenticator.cc
+++ b/auth/password_authenticator.cc
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2016 Cloudius Systems
+ * Copyright (C) 2016 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -218,12 +218,12 @@ future<::shared_ptr<auth::authenticated_user> > auth::password_authenticator::au
    // obsolete prepared statements pretty quickly.
    // Rely on query processing caching statements instead, and lets assume
    // that a map lookup string->statement is not gonna kill us much.
-    auto& qp = cql3::get_local_query_processor();
-    return qp.process(
-                    sprint("SELECT %s FROM %s.%s WHERE %s = ?", SALTED_HASH,
-                                    auth::AUTH_KS, CREDENTIALS_CF, USER_NAME),
-                    consistency_for_user(username), { username }, true).then_wrapped(
-                    [=](future<::shared_ptr<cql3::untyped_result_set>> f) {
+    return futurize_apply([this, username, password] {
+        auto& qp = cql3::get_local_query_processor();
+        return qp.process(sprint("SELECT %s FROM %s.%s WHERE %s = ?", SALTED_HASH,
+                                        auth::AUTH_KS, CREDENTIALS_CF, USER_NAME),
+                        consistency_for_user(username), {username}, true);
+    }).then_wrapped([=](future<::shared_ptr<cql3::untyped_result_set>> f) {
        try {
            auto res = f.get0();
            if (res->empty() || !checkpw(password, res->one().get_as<sstring>(SALTED_HASH))) {
@@ -234,6 +234,8 @@ future<::shared_ptr<auth::authenticated_user> > auth::password_authenticator::au
            std::throw_with_nested(exceptions::authentication_exception("Could not verify password"));
        } catch (exceptions::request_execution_exception& e) {
            std::throw_with_nested(exceptions::authentication_exception(e.what()));
+        } catch (...) {
+            std::throw_with_nested(exceptions::authentication_exception("authentication failed"));
        }
    });
 }
@@ -281,8 +283,9 @@ future<> auth::password_authenticator::drop(sstring username)
    }
 }

-auth::authenticator::resource_ids auth::password_authenticator::protected_resources() const {
-    return { data_resource(auth::AUTH_KS, CREDENTIALS_CF) };
+const auth::resource_ids& auth::password_authenticator::protected_resources() const { // now returns a reference instead of building a new set on every call
+    static const resource_ids ids({ data_resource(auth::AUTH_KS, CREDENTIALS_CF) }); // single entry: the credentials table of the auth keyspace
+    return ids;
 }

 ::shared_ptr<auth::authenticator::sasl_challenge> auth::password_authenticator::new_sasl_challenge() const {
--- a/auth/password_authenticator.hh
+++ b/auth/password_authenticator.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2016 Cloudius Systems
+ * Copyright (C) 2016 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -62,7 +62,7 @@ public:
    future<> create(sstring username, const option_map& options) throw(exceptions::request_validation_exception, exceptions::request_execution_exception) override;
    future<> alter(sstring username, const option_map& options) throw(exceptions::request_validation_exception, exceptions::request_execution_exception) override;
    future<> drop(sstring username) throw(exceptions::request_validation_exception, exceptions::request_execution_exception) override;
-    resource_ids protected_resources() const override;
+    const resource_ids& protected_resources() const override;
    ::shared_ptr<sasl_challenge> new_sasl_challenge() const override;


--- a/auth/permission.cc
+++ b/auth/permission.cc
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2016 Cloudius Systems
+ * Copyright (C) 2016 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -39,11 +39,66 @@
 * along with Scylla.  If not, see <http://www.gnu.org/licenses/>.
 */

+#include <unordered_map>
+#include <boost/algorithm/string.hpp>
 #include "permission.hh"

-const auth::permission_set auth::ALL_DATA = auth::permission_set::of
-                < auth::permission::CREATE, auth::permission::ALTER,
-                auth::permission::DROP, auth::permission::SELECT,
-                auth::permission::MODIFY, auth::permission::AUTHORIZE>();
-const auth::permission_set auth::ALL = auth::ALL_DATA;
-const auth::permission_set auth::NONE;
+const auth::permission_set auth::permissions::ALL_DATA = // CREATE, ALTER, DROP, SELECT, MODIFY and AUTHORIZE
+                auth::permission_set::of<auth::permission::CREATE,
+                                auth::permission::ALTER, auth::permission::DROP,
+                                auth::permission::SELECT,
+                                auth::permission::MODIFY,
+                                auth::permission::AUTHORIZE>();
+const auth::permission_set auth::permissions::ALL = auth::permissions::ALL_DATA; // currently a plain copy of ALL_DATA
+const auth::permission_set auth::permissions::NONE; // default-constructed; from_strings() starts from it
+const auth::permission_set auth::permissions::ALTERATIONS = // CREATE, ALTER and DROP
+                auth::permission_set::of<auth::permission::CREATE,
+                                auth::permission::ALTER, auth::permission::DROP>();
+
+static const std::unordered_map<sstring, auth::permission> permission_names({ // upper-case name -> permission; the lookup table behind to_string(), from_string() and the set variants
+    { "READ", auth::permission::READ },
+    { "WRITE", auth::permission::WRITE  },
+    { "CREATE", auth::permission::CREATE },
+    { "ALTER", auth::permission::ALTER },
+    { "DROP", auth::permission::DROP },
+    { "SELECT", auth::permission::SELECT  },
+    { "MODIFY", auth::permission::MODIFY   },
+    { "AUTHORIZE", auth::permission::AUTHORIZE },
+});
+
+const sstring& auth::permissions::to_string(permission p) {
+    // Reverse lookup: walk the name table until the entry mapped to `p` shows up.
+    auto entry = permission_names.begin();
+    for (; entry != permission_names.end() && entry->second != p; ++entry) {
+    }
+    if (entry == permission_names.end()) { throw std::out_of_range("unknown permission"); }
+    return entry->first;
+}
+
+auth::permission auth::permissions::from_string(const sstring& s) {
+    // Lookup is case-insensitive: the table keys are upper case, so normalise a copy first.
+    auto key = s; boost::to_upper(key);
+    return permission_names.at(key);
+}
+
+std::unordered_set<sstring> auth::permissions::to_strings(const permission_set& set) {
+    // Collect the textual name of every known permission contained in `set`.
+    std::unordered_set<sstring> names;
+    for (const auto& entry : permission_names) {
+        if (!set.contains(entry.second)) { continue; }
+        names.emplace(entry.first);
+    }
+    return names;
+}
+
+auth::permission_set auth::permissions::from_strings(const std::unordered_set<sstring>& set) {
+    auto parsed = auth::permissions::NONE; // start from NONE, then switch on each named permission
+    for (auto it = set.begin(); it != set.end(); ++it) {
+        parsed.set(from_string(*it));
+    }
+    return parsed;
+}
+
+bool auth::operator<(const permission_set& p1, const permission_set& p2) { // Orders permission sets by comparing their mask() values.
+    return p1.mask() < p2.mask();
+}
--- a/auth/permission.hh
+++ b/auth/permission.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2016 Cloudius Systems
+ * Copyright (C) 2016 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -41,6 +41,9 @@

 #pragma once

+#include <unordered_set>
+#include <seastar/core/sstring.hh>
+
 #include "enum_set.hh"

 namespace auth {
@@ -74,8 +77,22 @@ typedef enum_set<super_enum<permission,
                permission::MODIFY,
                permission::AUTHORIZE>> permission_set;

+bool operator<(const permission_set&, const permission_set&);
+
+namespace permissions { // predefined permission sets plus name <-> permission conversion helpers
+
 extern const permission_set ALL_DATA;
 extern const permission_set ALL;
 extern const permission_set NONE;
+extern const permission_set ALTERATIONS; // CREATE, ALTER and DROP (see permission.cc)
+// Single-permission conversion: from_string() ignores case; both throw std::out_of_range when there is no match.
+const sstring& to_string(permission);
+permission from_string(const sstring&);
+// The same conversions applied to whole permission sets.
+std::unordered_set<sstring> to_strings(const permission_set&);
+permission_set from_strings(const std::unordered_set<sstring>&);
+
+
+}

 }
--- a/bytes.cc
+++ b/bytes.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 2014 Cloudius Systems, Ltd.
+ * Copyright (C) 2014 ScyllaDB
 */

 /*
--- a/bytes.hh
+++ b/bytes.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 2015 Cloudius Systems, Ltd.
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/bytes_ostream.hh
+++ b/bytes_ostream.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -38,6 +38,7 @@ class bytes_ostream {
 public:
    using size_type = bytes::size_type;
    using value_type = bytes::value_type;
+    static constexpr size_type max_chunk_size = 16 * 1024; // 16 KiB: write() asks alloc() for at most this much at a time, and reduce_chunk_count() linearizes only buffers smaller than this
 private:
    static_assert(sizeof(value_type) == 1, "value_type is assumed to be one byte long");
    struct chunk {
@@ -153,19 +154,18 @@ public:
    }

    bytes_ostream& operator=(const bytes_ostream& o) {
-        _size = 0;
-        _current = nullptr;
-        _begin = {};
-        append(o);
+        if (this != &o) { // self-assignment is a no-op
+            auto x = bytes_ostream(o); // build the copy first ...
+            *this = std::move(x); // ... then take it over through the move assignment
+        }
        return *this;
    }

    bytes_ostream& operator=(bytes_ostream&& o) noexcept {
-        _size = o._size;
-        _begin = std::move(o._begin);
-        _current = o._current;
-        o._current = nullptr;
-        o._size = 0;
+        if (this != &o) { // guard: destroying *this on a self-move would destroy the source too
+            this->~bytes_ostream(); // release whatever this object currently holds
+            new (this) bytes_ostream(std::move(o)); // rebuild in place from o through the move constructor
+        }
        return *this;
    }

@@ -174,7 +174,7 @@ public:
        value_type* ptr;
        // makes the place_holder looks like a stream
        seastar::simple_output_stream get_stream() {
-            return seastar::simple_output_stream{reinterpret_cast<char*>(ptr)};
+            return seastar::simple_output_stream(reinterpret_cast<char*>(ptr), sizeof(T)); // the stream is now also given its size: sizeof(T) bytes starting at ptr
        }
    };

@@ -195,19 +195,19 @@ public:
        if (v.empty()) {
            return;
        }
-        auto space_left = current_space_left();
-        if (v.size() <= space_left) {
-            memcpy(_current->data + _current->offset, v.begin(), v.size());
-            _current->offset += v.size();
-            _size += v.size();
-        } else {
-            if (space_left) {
-                memcpy(_current->data + _current->offset, v.begin(), space_left);
-                _current->offset += space_left;
-                _size += space_left;
-                v.remove_prefix(space_left);
-            }
-            memcpy(alloc(v.size()), v.begin(), v.size());
+
+        auto this_size = std::min(v.size(), size_t(current_space_left()));
+        if (this_size) {
+            memcpy(_current->data + _current->offset, v.begin(), this_size);
+            _current->offset += this_size;
+            _size += this_size;
+            v.remove_prefix(this_size);
+        }
+
+        while (!v.empty()) {
+            auto this_size = std::min(v.size(), size_t(max_chunk_size));
+            std::copy_n(v.begin(), this_size, alloc(this_size));
+            v.remove_prefix(this_size);
        }
    }

@@ -272,13 +272,8 @@ public:
    }

    void append(const bytes_ostream& o) {
-        if (o.size() > 0) {
-            auto dst = alloc(o.size());
-            auto r = o._begin.get();
-            while (r) {
-                dst = std::copy_n(r->data, r->offset, dst);
-                r = r->next.get();
-            }
+        for (auto&& bv : o.fragments()) { // copy fragment by fragment through write() instead of one alloc(o.size())
+            write(bv);
        }
    }

@@ -328,6 +323,45 @@ public:
        _current->next = nullptr;
        _current->offset = pos._offset;
    }
+
+    void reduce_chunk_count() {
+        // FIXME: This is a simplified version. It linearizes the whole buffer
+        // if its size is below max_chunk_size. We could probably also gain
+        // some read performance by doing a "real" reduction, i.e. merging
+        // chunks until all but the last one are max_chunk_size long.
+        if (size() < max_chunk_size) {
+            linearize();
+        }
+    }
+
+    bool operator==(const bytes_ostream& other) const {
+        // Streams of different length are never equal. Checking up front matters:
+        // once one side ran dry the loop below would compare zero bytes forever.
+        if (size() != other.size()) {
+            return false;
+        }
+        auto as = fragments().begin();
+        auto as_end = fragments().end();
+        auto bs = other.fragments().begin();
+        auto bs_end = other.fragments().end();
+        auto a = *as++;
+        auto b = *bs++;
+        while (!a.empty() || !b.empty()) {
+            auto now = std::min(a.size(), b.size());
+            if (!std::equal(a.begin(), a.begin() + now, b.begin(), b.begin() + now)) {
+                return false;
+            }
+            a.remove_prefix(now);
+            b.remove_prefix(now);
+            if (a.empty() && as != as_end) { a = *as++; }
+            if (b.empty() && bs != bs_end) { b = *bs++; }
+        }
+        return true;
+    }
+
+    bool operator!=(const bytes_ostream& other) const { // plain negation of operator==
+        return !(*this == other);
+    }
 };

 template<>
--- a/caching_options.hh
+++ b/caching_options.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 2015 Cloudius Systems, Ltd.
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/cartesian_product.hh
+++ b/cartesian_product.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 *
 */

--- a/checked-file-impl.hh
+++ b/checked-file-impl.hh
@@ -0,0 +1,151 @@
+/*
+ * Copyright (C) 2016 ScyllaDB
+ */
+
+/*
+ * This file is part of Scylla.
+ *
+ * Scylla is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU Affero General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * Scylla is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with Scylla.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#pragma once
+
+#include "seastar/core/file.hh"
+#include "disk-error-handler.hh"
+
+class checked_file_impl : public file_impl { // file_impl wrapper that runs every operation of another file through do_io_check()
+public:
+    // Keeps a reference to the signal and a copy of the file handle, and mirrors the file's three DMA alignment values.
+    checked_file_impl(disk_error_signal_type& s, file f)
+            : _signal(s) , _file(f) {
+        _memory_dma_alignment = f.memory_dma_alignment();
+        _disk_read_dma_alignment = f.disk_read_dma_alignment();
+        _disk_write_dma_alignment = f.disk_write_dma_alignment();
+    }
+    // Each override below forwards its arguments unchanged to the wrapped file's implementation, inside do_io_check(_signal, ...).
+    virtual future<size_t> write_dma(uint64_t pos, const void* buffer, size_t len, const io_priority_class& pc) override {
+        return do_io_check(_signal, [&] {
+            return get_file_impl(_file)->write_dma(pos, buffer, len, pc);
+        });
+    }
+
+    virtual future<size_t> write_dma(uint64_t pos, std::vector<iovec> iov, const io_priority_class& pc) override {
+        return do_io_check(_signal, [&] {
+            return get_file_impl(_file)->write_dma(pos, iov, pc);
+        });
+    }
+
+    virtual future<size_t> read_dma(uint64_t pos, void* buffer, size_t len, const io_priority_class& pc) override {
+        return do_io_check(_signal, [&] {
+            return get_file_impl(_file)->read_dma(pos, buffer, len, pc);
+        });
+    }
+
+    virtual future<size_t> read_dma(uint64_t pos, std::vector<iovec> iov, const io_priority_class& pc) override {
+        return do_io_check(_signal, [&] {
+            return get_file_impl(_file)->read_dma(pos, iov, pc);
+        });
+    }
+
+    virtual future<> flush(void) override {
+        return do_io_check(_signal, [&] {
+            return get_file_impl(_file)->flush();
+        });
+    }
+
+    virtual future<struct stat> stat(void) override {
+        return do_io_check(_signal, [&] {
+            return get_file_impl(_file)->stat();
+        });
+    }
+
+    virtual future<> truncate(uint64_t length) override {
+        return do_io_check(_signal, [&] {
+            return get_file_impl(_file)->truncate(length);
+        });
+    }
+
+    virtual future<> discard(uint64_t offset, uint64_t length) override {
+        return do_io_check(_signal, [&] {
+            return get_file_impl(_file)->discard(offset, length);
+        });
+    }
+
+    virtual future<> allocate(uint64_t position, uint64_t length) override {
+        return do_io_check(_signal, [&] {
+            return get_file_impl(_file)->allocate(position, length);
+        });
+    }
+
+    virtual future<uint64_t> size(void) override {
+        return do_io_check(_signal, [&] {
+            return get_file_impl(_file)->size();
+        });
+    }
+
+    virtual future<> close() override {
+        return do_io_check(_signal, [&] {
+            return get_file_impl(_file)->close();
+        });
+    }
+
+    virtual subscription<directory_entry> list_directory(std::function<future<> (directory_entry de)> next) override {
+        return do_io_check(_signal, [&] {
+            return get_file_impl(_file)->list_directory(next);
+        });
+    }
+
+private:
+    disk_error_signal_type &_signal; // not owned; handed to do_io_check() on every call (presumably how I/O errors get reported -- see disk-error-handler.hh)
+    file _file; // the wrapped file every operation is forwarded to
+};
+
+inline file make_checked_file(disk_error_signal_type& signal, file& f) // Returns a file backed by a checked_file_impl that wraps f and reports through signal.
+{
+    return file(::make_shared<checked_file_impl>(signal, f));
+}
+
+future<file>
+inline open_checked_file_dma(disk_error_signal_type& signal,
+                             sstring name, open_flags flags,
+                             file_open_options options)
+{ // Opens `name` via open_file_dma() inside do_io_check() and resolves to the file wrapped by make_checked_file().
+    return do_io_check(signal, [&] {
+        return open_file_dma(name, flags, options).then([&] (file f) { // NOTE(review): by-reference capture in a continuation; only `signal` is used inside, so the signal object must stay alive until the open completes
+            return make_ready_future<file>(make_checked_file(signal, f));
+        });
+    });
+}
+
+future<file>
+inline open_checked_file_dma(disk_error_signal_type& signal,
+                             sstring name, open_flags flags)
+{ // Overload without file_open_options: same flow, using the two-argument open_file_dma().
+    return do_io_check(signal, [&] {
+        return open_file_dma(name, flags).then([&] (file f) { // NOTE(review): only `signal` is used from the by-reference capture; it must stay alive until the open completes
+            return make_ready_future<file>(make_checked_file(signal, f));
+        });
+    });
+}
+
+future<file>
+inline open_checked_directory(disk_error_signal_type& signal,
+                              sstring name)
+{ // Opens the directory `name` via engine().open_directory() inside do_io_check() and resolves to the wrapped file.
+    return do_io_check(signal, [&] {
+        return engine().open_directory(name).then([&] (file f) { // NOTE(review): only `signal` is used from the by-reference capture; it must stay alive until the open completes
+            return make_ready_future<file>(make_checked_file(signal, f));
+        });
+    });
+}
--- a/clustering_bounds_comparator.hh
+++ b/clustering_bounds_comparator.hh
@@ -0,0 +1,127 @@
+
+/*
+ * Copyright (C) 2016 ScyllaDB
+ */
+
+/*
+ * This file is part of Scylla.
+ *
+ * Scylla is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU Affero General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * Scylla is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with Scylla.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#pragma once
+
+#include "keys.hh"
+#include "schema.hh"
+#include "range.hh"
+
+/**
+ * Represents the kind of bound in a range tombstone.
+ */
+enum class bound_kind : uint8_t {
+    excl_end = 0, // end bound that excludes its prefix
+    incl_start = 1, // start bound that includes its prefix
+    // values 2 to 5 are reserved for forward Origin compatibility
+    incl_end = 6, // end bound that includes its prefix
+    excl_start = 7, // start bound that excludes its prefix
+};
+
+std::ostream& operator<<(std::ostream& out, const bound_kind k);
+
+bound_kind invert_kind(bound_kind k);
+int32_t weight(bound_kind k);
+
+static inline bound_kind flip_bound_kind(bound_kind bk)
+{
+    // Swap start <-> end while keeping the inclusive/exclusive flavour.
+    if (bk == bound_kind::excl_end) { return bound_kind::excl_start; }
+    if (bk == bound_kind::incl_end) { return bound_kind::incl_start; }
+    if (bk == bound_kind::excl_start) { return bound_kind::excl_end; }
+    if (bk == bound_kind::incl_start) { return bound_kind::incl_end; }
+    // Only reachable when bk holds a value outside the enum.
+    abort();
+}
+
+class bound_view { // Non-owning view of one range bound: a reference to a clustering key prefix plus its bound_kind.
+    const static thread_local clustering_key empty_prefix; // the prefix used by bottom() and top()
+public:
+    const clustering_key_prefix& prefix; // not owned: the referenced prefix must outlive this view
+    bound_kind kind;
+    bound_view(const clustering_key_prefix& prefix, bound_kind kind)
+        : prefix(prefix)
+        , kind(kind)
+    { }
+    struct compare { // less-than predicate over (prefix, weight) pairs
+        // To make it assignable and to avoid taking a schema_ptr, we
+        // wrap the schema reference.
+        std::reference_wrapper<const schema> _s;
+        compare(const schema& s) : _s(s)
+        { }
+        bool operator()(const clustering_key_prefix& p1, int32_t w1, const clustering_key_prefix& p2, int32_t w2) const {
+            auto type = _s.get().clustering_key_prefix_type();
+            auto res = prefix_equality_tri_compare(type->types().begin(),
+                type->begin(p1), type->end(p1),
+                type->begin(p2), type->end(p2),
+                tri_compare);
+            if (res) { // a non-zero component comparison decides the order on its own
+                return res < 0;
+            }
+            auto d1 = p1.size(_s);
+            auto d2 = p2.size(_s);
+            if (d1 == d2) { // same number of components: the weights break the tie
+                return w1 < w2;
+            }
+            return d1 < d2 ? w1 <= 0 : w2 > 0; // different lengths: only the weight of the shorter prefix is consulted
+        }
+        bool operator()(const bound_view b, const clustering_key_prefix& p) const { // a bare prefix is compared with weight 0
+            return operator()(b.prefix, weight(b.kind), p, 0);
+        }
+        bool operator()(const clustering_key_prefix& p, const bound_view b) const { // mirror image of the overload above
+            return operator()(p, 0, b.prefix, weight(b.kind));
+        }
+        bool operator()(const bound_view b1, const bound_view b2) const { // each bound contributes weight(kind)
+            return operator()(b1.prefix, weight(b1.kind), b2.prefix, weight(b2.kind));
+        }
+    };
+    bool equal(const schema& s, const bound_view other) const { // same kind and equal prefixes
+        return kind == other.kind && prefix.equal(s, other.prefix);
+    }
+    bool adjacent(const schema& s, const bound_view other) const { // equal prefixes and this kind is invert_kind() of the other's
+        return invert_kind(other.kind) == kind && prefix.equal(s, other.prefix);
+    }
+    static bound_view bottom() { // inclusive start on the empty prefix
+        return {empty_prefix, bound_kind::incl_start};
+    }
+    static bound_view top() { // inclusive end on the empty prefix
+        return {empty_prefix, bound_kind::incl_end};
+    }
+    /*
+    template<template<typename> typename T, typename U>
+    concept bool Range() {
+        return requires (T<U> range) {
+            { range.start() } -> stdx::optional<U>;
+            { range.end() } -> stdx::optional<U>;
+        };
+    };*/
+    template<template<typename> typename Range>
+    static std::pair<bound_view, bound_view> from_range(const Range<clustering_key_prefix>& range) { // (start, end) views; a missing start maps to bottom(), a missing end to top(); the views refer into `range`
+        return {
+            range.start() ? bound_view(range.start()->value(), range.start()->is_inclusive() ? bound_kind::incl_start : bound_kind::excl_start) : bottom(),
+            range.end() ? bound_view(range.end()->value(), range.end()->is_inclusive() ? bound_kind::incl_end : bound_kind::excl_end) : top(),
+        };
+    }
+    friend std::ostream& operator<<(std::ostream& out, const bound_view& b) { // prints as {bound: prefix=..., kind=...}
+        return out << "{bound: prefix=" << b.prefix << ", kind=" << b.kind << "}";
+    }
+};
--- a/clustering_key_filter.hh
+++ b/clustering_key_filter.hh
@@ -0,0 +1,67 @@
+/*
+ * Copyright (C) 2016 ScyllaDB
+ *
+ * Modified by ScyllaDB
+ */
+
+/*
+ * This file is part of Scylla.
+ *
+ * Scylla is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU Affero General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * Scylla is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with Scylla.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#pragma once
+
+#include "schema.hh"
+#include "query-request.hh"
+
+namespace query {
+
+class clustering_key_filter_ranges { // Range list that is either borrowed from the caller or an owned, reversed copy.
+    clustering_row_ranges _storage; // owned ranges; filled by the reversing constructor or by a move from such an object
+    const clustering_row_ranges& _ref; // what the accessors read: either the caller's ranges or _storage
+public:
+    clustering_key_filter_ranges(const clustering_row_ranges& ranges) : _ref(ranges) { } // borrows: `ranges` must outlive this object
+    struct reversed { }; // tag type selecting the reversing constructor
+    clustering_key_filter_ranges(reversed, const clustering_row_ranges& ranges)
+        : _storage(ranges.rbegin(), ranges.rend()), _ref(_storage) { } // copies `ranges` in reverse order and reads from the copy
+    // Move: if `other` was reading its own storage, read ours (now holding the moved data); otherwise keep the external reference.
+    clustering_key_filter_ranges(clustering_key_filter_ranges&& other) noexcept
+        : _storage(std::move(other._storage))
+        , _ref(&other._ref == &other._storage ? _storage : other._ref)
+    { }
+    // A reference member cannot be reseated, so assignment destroys *this and move-constructs a new object in place.
+    clustering_key_filter_ranges& operator=(clustering_key_filter_ranges&& other) noexcept {
+        if (this != &other) {
+            this->~clustering_key_filter_ranges();
+            new (this) clustering_key_filter_ranges(std::move(other));
+        }
+        return *this;
+    }
+    // Read-only access to whichever range list _ref designates.
+    auto begin() const { return _ref.begin(); }
+    auto end() const { return _ref.end(); }
+    bool empty() const { return _ref.empty(); }
+    size_t size() const { return _ref.size(); }
+    // Ranges of `slice` for `key`: a reversed copy when the slice has the reversed option, otherwise a borrow of what slice.row_ranges() returned.
+    static clustering_key_filter_ranges get_ranges(const schema& schema, const query::partition_slice& slice, const partition_key& key) {
+        const query::clustering_row_ranges& ranges = slice.row_ranges(schema, key);
+        if (slice.options.contains(query::partition_slice::option::reversed)) {
+            return clustering_key_filter_ranges(clustering_key_filter_ranges::reversed{}, ranges);
+        }
+        return clustering_key_filter_ranges(ranges);
+    }
+};
+
+}
--- a/combine.hh
+++ b/combine.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 2015 Cloudius Systems, Ltd.
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/compaction_strategy.hh
+++ b/compaction_strategy.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -22,6 +22,8 @@
 #pragma once

 class column_family;
+class schema;
+using schema_ptr = lw_shared_ptr<const schema>;

 namespace sstables {

@@ -30,11 +32,12 @@ enum class compaction_strategy_type {
    major,
    size_tiered,
    leveled,
-    // FIXME: Add support to DateTiered.
+    date_tiered,
 };

 class compaction_strategy_impl;
 class sstable;
+class sstable_set;
 struct compaction_descriptor;

 class compaction_strategy {
@@ -51,6 +54,19 @@ public:
    // Return a list of sstables to be compacted after applying the strategy.
    compaction_descriptor get_sstables_for_compaction(column_family& cfs, std::vector<lw_shared_ptr<sstable>> candidates);

+    // Some strategies may look at the compacted and resulting sstables to
+    // get some useful information for subsequent compactions.
+    void notify_completion(const std::vector<lw_shared_ptr<sstable>>& removed, const std::vector<lw_shared_ptr<sstable>>& added);
+
+    // Return if parallel compaction is allowed by strategy.
+    bool parallel_compaction() const;
+
+    // Return if optimization to rule out sstables based on clustering key filter should be applied.
+    bool use_clustering_key_filter() const;
+
+    // An estimate of the number of compactions needed for the strategy to be satisfied.
+    int64_t estimated_pending_compactions(column_family& cf) const;
+
    static sstring name(compaction_strategy_type type) {
        switch (type) {
        case compaction_strategy_type::null:
@@ -61,6 +77,8 @@ public:
            return "SizeTieredCompactionStrategy";
        case compaction_strategy_type::leveled:
            return "LeveledCompactionStrategy";
+        case compaction_strategy_type::date_tiered:
+            return "DateTieredCompactionStrategy";
        default:
            throw std::runtime_error("Invalid Compaction Strategy");
        }
@@ -77,6 +95,8 @@ public:
            return compaction_strategy_type::size_tiered;
        } else if (short_name == "LeveledCompactionStrategy") {
            return compaction_strategy_type::leveled;
+        } else if (short_name == "DateTieredCompactionStrategy") {
+            return compaction_strategy_type::date_tiered;
        } else {
            throw exceptions::configuration_exception(sprint("Unable to find compaction strategy class '%s'", name));
        }
@@ -87,6 +107,8 @@ public:
    sstring name() const {
        return name(type());
    }
+
+    sstable_set make_sstable_set(schema_ptr schema) const;
 };

 // Creates a compaction_strategy object from one of the strategies available.
--- a/compatible_ring_position.hh
+++ b/compatible_ring_position.hh
@@ -0,0 +1,64 @@
+/*
+ * Copyright (C) 2016 ScyllaDB
+ */
+
+/*
+ * This file is part of Scylla.
+ *
+ * Scylla is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU Affero General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * Scylla is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with Scylla.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+
+#pragma once
+
+#include "query-request.hh"
+#include <experimental/optional>
+
+// Wraps ring_position so it is compatible with old-style C++: default constructor,
+// stateless comparators, yada yada
+class compatible_ring_position {
+    const schema* _schema = nullptr; // stays null for a default-constructed object
+    // optional to supply a default constructor, no more
+    std::experimental::optional<dht::ring_position> _rp;
+public:
+    compatible_ring_position() noexcept = default; // holds neither a schema nor a position
+    compatible_ring_position(const schema& s, const dht::ring_position& rp)
+            : _schema(&s), _rp(rp) { // stores the schema's address: `s` must outlive this object
+    }
+    compatible_ring_position(const schema& s, dht::ring_position&& rp)
+            : _schema(&s), _rp(std::move(rp)) {
+    }
+    friend int tri_compare(const compatible_ring_position& x, const compatible_ring_position& y) { // uses x's schema; both operands must hold a position, nothing is checked here
+        return x._rp->tri_compare(*x._schema, *y._rp);
+    }
+    friend bool operator<(const compatible_ring_position& x, const compatible_ring_position& y) { // this and the remaining relational operators all derive from tri_compare
+        return tri_compare(x, y) < 0;
+    }
+    friend bool operator<=(const compatible_ring_position& x, const compatible_ring_position& y) {
+        return tri_compare(x, y) <= 0;
+    }
+    friend bool operator>(const compatible_ring_position& x, const compatible_ring_position& y) {
+        return tri_compare(x, y) > 0;
+    }
+    friend bool operator>=(const compatible_ring_position& x, const compatible_ring_position& y) {
+        return tri_compare(x, y) >= 0;
+    }
+    friend bool operator==(const compatible_ring_position& x, const compatible_ring_position& y) {
+        return tri_compare(x, y) == 0;
+    }
+    friend bool operator!=(const compatible_ring_position& x, const compatible_ring_position& y) {
+        return tri_compare(x, y) != 0;
+    }
+};
+
--- a/compound.hh
+++ b/compound.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 2015 Cloudius Systems, Ltd.
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/compound_compat.hh
+++ b/compound_compat.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -21,7 +21,10 @@

 #pragma once

+#include <boost/range/algorithm/copy.hpp>
+#include <boost/range/adaptor/transformed.hpp>
 #include "compound.hh"
+#include "schema.hh"

 //
 // This header provides adaptors between the representation used by our compound_type<>
@@ -180,3 +183,348 @@ bytes to_legacy(CompoundType& type, bytes_view packed) {
    std::copy(lv.begin(), lv.end(), legacy_form.begin());
    return legacy_form;
 }
+
+// Represents a value serialized according to Origin's CompositeType.
+// If is_compound is true, then the value is one or more components encoded as:
+//
+//   <representation> ::= ( <component> )+
+//   <component>      ::= <length> <value> <EOC>
+//   <length>         ::= <uint16_t>
+//   <EOC>            ::= <uint8_t>
+//
+// If false, then it encodes a single value, without a prefix length or a suffix EOC.
+class composite final {
+    bytes _bytes; // serialized form; its layout depends on _is_compound
+    bool _is_compound;
+public:
+    composite(bytes&& b, bool is_compound)
+            : _bytes(std::move(b))
+            , _is_compound(is_compound)
+    { }
+
+    composite(bytes&& b) // non-explicit: the factory functions below rely on this bytes -> composite conversion
+            : _bytes(std::move(b))
+            , _is_compound(true)
+    { }
+
+    composite()
+            : _bytes()
+            , _is_compound(true)
+    { }
+
+    using size_type = uint16_t;
+    using eoc_type = int8_t;
+
+    /*
+     * The 'end-of-component' byte should always be 0 for an actual column name.
+     * However, it can be set to 1 for query bounds. This allows querying for the
+     * equivalent of 'give me the full range'. That is, if a slice query is:
+     *   start = <3><"foo".getBytes()><0>
+     *   end   = <3><"foo".getBytes()><1>
+     * then we'll return *all* the columns whose first component is "foo".
+     * If for a component, the 'end-of-component' is != 0, there should not be any
+     * following component. The end-of-component can also be -1 to allow
+     * non-inclusive query. For instance:
+     *   end = <3><"foo".getBytes()><-1>
+     * allows to query everything that is smaller than <3><"foo".getBytes()>, but
+     * not <3><"foo".getBytes()> itself.
+     */
+    enum class eoc : eoc_type {
+        start = -1,
+        none = 0,
+        end = 1
+    };
+
+    using component = std::pair<bytes, eoc>;
+    using component_view = std::pair<bytes_view, eoc>;
+private:
+    template<typename Value, typename = std::enable_if_t<!std::is_same<data_value, std::decay_t<Value>>::value>>
+    static size_t size(Value& val) { // generic path for values exposing size(); disabled for (const) data_value
+        return val.size();
+    }
+    static size_t size(const data_value& val) {
+        return val.serialized_size();
+    }
+    template<typename Value, typename = std::enable_if_t<!std::is_same<data_value, std::decay_t<Value>>::value>>
+    static void write_value(Value&& val, bytes::iterator& out) {
+        out = std::copy(val.begin(), val.end(), out);
+    }
+    static void write_value(const data_value& val, bytes::iterator& out) {
+        val.serialize(out);
+    }
+    template<typename RangeOfSerializedComponents>
+    static void serialize_value(RangeOfSerializedComponents&& values, bytes::iterator& out, bool is_compound) {
+        if (!is_compound) {
+            auto it = values.begin();
+            write_value(std::forward<decltype(*it)>(*it), out);
+            return;
+        }
+
+        for (auto&& val : values) {
+            write<size_type>(out, static_cast<size_type>(size(val)));
+            write_value(std::forward<decltype(val)>(val), out);
+            // Range tombstones are not keys. For collections, only frozen
+            // values can be keys. Therefore, for as long as it is safe to
+            // assume that this code will be used to create keys, it is safe
+            // to assume the trailing byte is always zero.
+            write<eoc_type>(out, eoc_type(eoc::none));
+        }
+    }
+    template <typename RangeOfSerializedComponents>
+    static size_t serialized_size(RangeOfSerializedComponents&& values, bool is_compound) {
+        size_t len = 0;
+        auto it = values.begin();
+        if (it != values.end()) {
+            // CQL3 uses a specific prefix (0xFFFF) to encode "static columns"
+            // (CASSANDRA-6561). This does mean the maximum size of the first component of a
+            // composite is 65534, not 65535 (or we wouldn't be able to detect if the first 2
+            // bytes is the static prefix or not).
+            auto value_size = size(*it);
+            if (value_size > static_cast<size_type>(std::numeric_limits<size_type>::max() - uint8_t(is_compound))) {
+                throw std::runtime_error(sprint("First component size too large: %d > %d", value_size, std::numeric_limits<size_type>::max() - is_compound));
+            }
+            if (!is_compound) {
+                return value_size; // a non-compound value is written without length prefix or EOC
+            }
+            len += sizeof(size_type) + value_size + sizeof(eoc_type);
+            ++it;
+        }
+        for ( ; it != values.end(); ++it) {
+            auto value_size = size(*it);
+            if (value_size > std::numeric_limits<size_type>::max()) {
+                throw std::runtime_error(sprint("Component size too large: %d > %d", value_size, std::numeric_limits<size_type>::max()));
+            }
+            len += sizeof(size_type) + value_size + sizeof(eoc_type);
+        }
+        return len;
+    }
+public:
+    template <typename Describer>
+    auto describe_type(Describer f) const {
+        return f(const_cast<bytes&>(_bytes));
+    }
+
+    template<typename RangeOfSerializedComponents>
+    static bytes serialize_value(RangeOfSerializedComponents&& values, bool is_compound = true) {
+        auto size = serialized_size(values, is_compound); // also validates component sizes; may throw std::runtime_error
+        bytes b(bytes::initialized_later(), size);
+        auto i = b.begin();
+        serialize_value(std::forward<decltype(values)>(values), i, is_compound);
+        return b;
+    }
+
+    class iterator : public std::iterator<std::input_iterator_tag, const component_view> {
+        bytes_view _v; // bytes not yet parsed
+        component_view _current;
+    private:
+        eoc to_eoc(int8_t eoc_byte) { // any negative byte maps to start, any positive byte to end
+            return eoc_byte == 0 ? eoc::none : (eoc_byte < 0 ? eoc::start : eoc::end);
+        }
+
+        void read_current() {
+            size_type len;
+            {
+                if (_v.empty()) { // input exhausted: take the same state as the end iterator
+                    _v = bytes_view(nullptr, 0);
+                    return;
+                }
+                len = read_simple<size_type>(_v);
+                if (_v.size() < len) {
+                    throw marshal_exception();
+                }
+            }
+            auto value = bytes_view(_v.begin(), len);
+            _v.remove_prefix(len);
+            _current = component_view(std::move(value), to_eoc(read_simple<eoc_type>(_v)));
+        }
+    public:
+        struct end_iterator_tag {};
+
+        iterator(const bytes_view& v, bool is_compound, bool is_static)
+                : _v(v) {
+            if (is_static) {
+                _v.remove_prefix(2); // skip the two-byte static marker
+            }
+            if (is_compound) {
+                read_current();
+            } else {
+                _current = component_view(_v, eoc::none);
+                _v.remove_prefix(_v.size());
+            }
+        }
+
+        iterator(end_iterator_tag) : _v(nullptr, 0) {}
+
+        iterator& operator++() {
+            read_current();
+            return *this;
+        }
+
+        iterator operator++(int) {
+            iterator i(*this);
+            ++(*this);
+            return i;
+        }
+
+        const value_type& operator*() const { return _current; }
+        const value_type* operator->() const { return &_current; }
+        bool operator!=(const iterator& i) const { return _v.begin() != i._v.begin(); }
+        bool operator==(const iterator& i) const { return _v.begin() == i._v.begin(); }
+    };
+
+    iterator begin() const {
+        return iterator(_bytes, _is_compound, is_static());
+    }
+
+    iterator end() const {
+        return iterator(iterator::end_iterator_tag());
+    }
+
+    boost::iterator_range<iterator> components() const & {
+        return { begin(), end() };
+    }
+
+    auto values() const & {
+        return components() | boost::adaptors::transformed([](auto&& c) { return c.first; });
+    }
+
+    std::vector<component> components() const && { // rvalue overload: returns owning copies instead of views
+        std::vector<component> result;
+        std::transform(begin(), end(), std::back_inserter(result), [](auto&& p) {
+            return component(bytes(p.first.begin(), p.first.end()), p.second);
+        });
+        return result;
+    }
+
+    std::vector<bytes> values() const && { // rvalue overload: returns owning copies instead of views
+        std::vector<bytes> result;
+        boost::copy(components() | boost::adaptors::transformed([](auto&& c) { return to_bytes(c.first); }), std::back_inserter(result));
+        return result;
+    }
+
+    const bytes& get_bytes() const {
+        return _bytes;
+    }
+
+    size_t size() const {
+        return _bytes.size();
+    }
+
+    bool empty() const {
+        return _bytes.empty();
+    }
+
+    static bool is_static(bytes_view bytes, bool is_compound) {
+        return is_compound && bytes.size() > 2 && (bytes[0] & bytes[1] & 0xff) == 0xff;
+    }
+
+    bool is_static() const {
+        return is_static(_bytes, _is_compound);
+    }
+
+    bool is_compound() const {
+        return _is_compound;
+    }
+
+    // The following factory functions assume this composite is a compound value.
+    template <typename ClusteringElement>
+    static composite from_clustering_element(const schema& s, const ClusteringElement& ce) {
+        return serialize_value(ce.components(s));
+    }
+
+    static composite from_exploded(const std::vector<bytes_view>& v, eoc marker = eoc::none) {
+        if (v.size() == 0) {
+            return bytes(size_t(1), bytes::value_type(marker));
+        }
+        auto b = serialize_value(v);
+        b.back() = eoc_type(marker); // the last component's EOC byte carries the marker
+        return composite(std::move(b));
+    }
+
+    static composite static_prefix(const schema& s) {
+        static bytes static_marker(size_t(2), bytes::value_type(0xff));
+
+        std::vector<bytes_view> sv(s.clustering_key_size()); // that many empty components
+        return static_marker + serialize_value(sv);
+    }
+
+    explicit operator bytes_view() const {
+        return _bytes;
+    }
+
+    template <typename Component>
+    friend inline std::ostream& operator<<(std::ostream& os, const std::pair<Component, eoc>& c) {
+        return os << "{value=" << c.first << "; eoc=" << sprint("0x%02x", eoc_type(c.second) & 0xff) << "}";
+    }
+};
+
+class composite_view final { // view counterpart of composite: a bytes_view plus the is_compound flag
+    bytes_view _bytes;
+    bool _is_compound;
+public:
+    composite_view(bytes_view b, bool is_compound = true)
+            : _bytes(b)
+            , _is_compound(is_compound)
+    { }
+
+    composite_view(const composite& c)
+            : composite_view(static_cast<bytes_view>(c), c.is_compound())
+    { }
+
+    composite_view()
+            : _bytes(nullptr, 0)
+            , _is_compound(true)
+    { }
+
+    std::vector<bytes> explode() const {
+        if (!_is_compound) { // a non-compound value is a single component: the bytes themselves
+            return { to_bytes(_bytes) };
+        }
+
+        std::vector<bytes> ret;
+        for (auto it = begin(), e = end(); it != e; ) {
+            ret.push_back(to_bytes(it->first));
+            auto marker = it->second;
+            ++it;
+            if (it != e && marker != composite::eoc::none) { // only the last component may carry a non-zero EOC
+                throw runtime_exception(sprint("non-zero component divider found (%d) mid", sprint("0x%02x", composite::eoc_type(marker) & 0xff)));
+            }
+        }
+        return ret;
+    }
+
+    composite::iterator begin() const {
+        return composite::iterator(_bytes, _is_compound, is_static());
+    }
+
+    composite::iterator end() const {
+        return composite::iterator(composite::iterator::end_iterator_tag());
+    }
+
+    boost::iterator_range<composite::iterator> components() const {
+        return { begin(), end() };
+    }
+
+    auto values() const {
+        return components() | boost::adaptors::transformed([](auto&& c) { return c.first; });
+    }
+
+    size_t size() const {
+        return _bytes.size();
+    }
+
+    bool empty() const {
+        return _bytes.empty();
+    }
+
+    bool is_static() const {
+        return composite::is_static(_bytes, _is_compound);
+    }
+
+    explicit operator bytes_view() const {
+        return _bytes;
+    }
+
+    bool operator==(const composite_view& k) const { return k._bytes == _bytes && k._is_compound == _is_compound; } // equal only if bytes and is_compound both match
+    bool operator!=(const composite_view& k) const { return !(k == *this); }
+};
--- a/compress.hh
+++ b/compress.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 2015 Cloudius Systems, Ltd.
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -32,7 +32,7 @@ enum class compressor {

 class compression_parameters {
 public:
-    static constexpr int32_t DEFAULT_CHUNK_LENGTH = 64 * 1024;
+    static constexpr int32_t DEFAULT_CHUNK_LENGTH = 4 * 1024;
    static constexpr double DEFAULT_CRC_CHECK_CHANCE = 1.0;

    static constexpr auto SSTABLE_COMPRESSION = "sstable_compression";
--- a/conf/housekeeping.cfg
+++ b/conf/housekeeping.cfg
@@ -0,0 +1,2 @@
+[housekeeping]
+check-version: True
--- a/conf/scylla.yaml
+++ b/conf/scylla.yaml
@@ -106,6 +106,19 @@ write_request_timeout_in_ms: 2000
 # most users should never need to adjust this.
 # phi_convict_threshold: 8

+# endpoint_snitch -- set this to a class that implements IEndpointSnitch.  The snitch has two functions:
+# - it teaches Scylla enough about your network topology to route
+#   requests efficiently
+# - it allows Scylla to spread replicas around your cluster to avoid
+#   correlated failures. It does this by grouping machines into
+#   "datacenters" and "racks."  Scylla will do its best not to have
+#   more than one replica on the same "rack" (which may not actually
+#   be a physical location)
+#
+# IF YOU CHANGE THE SNITCH AFTER DATA IS INSERTED INTO THE CLUSTER,
+# YOU MUST RUN A FULL REPAIR, SINCE THE SNITCH AFFECTS WHERE REPLICAS
+# ARE PLACED.
+#
 # Out of the box, Scylla provides
 #  - SimpleSnitch:
 #    Treats Strategy order as proximity. This can improve cache
@@ -179,10 +192,24 @@ api_address: 127.0.0.1
 # Caution should be taken on increasing the size of this threshold as it can lead to node instability.
 batch_size_warn_threshold_in_kb: 5

+# Authentication backend, identifying users
+# Out of the box, Scylla provides org.apache.cassandra.auth.{AllowAllAuthenticator,
+# PasswordAuthenticator}.
+#
+# - AllowAllAuthenticator performs no checks - set it to disable authentication.
+# - PasswordAuthenticator relies on username/password pairs to authenticate
+#   users. It keeps usernames and hashed passwords in system_auth.credentials table.
+#   Please increase system_auth keyspace replication factor if you use this authenticator.
+# authenticator: AllowAllAuthenticator

-###################################################
-## Not currently supported, reserved for future use
-###################################################
+# Authorization backend, implementing IAuthorizer; used to limit access/provide permissions
+# Out of the box, Scylla provides org.apache.cassandra.auth.{AllowAllAuthorizer,
+# CassandraAuthorizer}.
+#
+# - AllowAllAuthorizer allows any action to any user - set it to disable authorization.
+# - CassandraAuthorizer stores permissions in system_auth.permissions table. Please
+#   increase system_auth keyspace replication factor if you use this authorizer.
+# authorizer: AllowAllAuthorizer

 # initial_token allows you to specify tokens manually.  While you can use # it with
 # vnodes (num_tokens > 1, above) -- in which case you should provide a 
@@ -190,6 +217,10 @@ batch_size_warn_threshold_in_kb: 5
 # that do not have vnodes enabled.
 # initial_token:

+###################################################
+## Not currently supported, reserved for future use
+###################################################
+
 # See http://wiki.apache.org/cassandra/HintedHandoff
 # May either be "true" or "false" to enable globally, or contain a list
 # of data centers to enable per-datacenter.
@@ -216,25 +247,6 @@ batch_size_warn_threshold_in_kb: 5
 # reduced proportionally to the number of nodes in the cluster.
 # batchlog_replay_throttle_in_kb: 1024

-# Authentication backend, identifying users
-# Out of the box, Scylla provides org.apache.cassandra.auth.{AllowAllAuthenticator,
-# PasswordAuthenticator}.
-#
-# - AllowAllAuthenticator performs no checks - set it to disable authentication.
-# - PasswordAuthenticator relies on username/password pairs to authenticate
-#   users. It keeps usernames and hashed passwords in system_auth.credentials table.
-#   Please increase system_auth keyspace replication factor if you use this authenticator.
-# authenticator: AllowAllAuthenticator
-
-# Authorization backend, implementing IAuthorizer; used to limit access/provide permissions
-# Out of the box, Scylla provides org.apache.cassandra.auth.{AllowAllAuthorizer,
-# CassandraAuthorizer}.
-#
-# - AllowAllAuthorizer allows any action to any user - set it to disable authorization.
-# - CassandraAuthorizer stores permissions in system_auth.permissions table. Please
-#   increase system_auth keyspace replication factor if you use this authorizer.
-# authorizer: AllowAllAuthorizer
-
 # Validity period for permissions cache (fetching permissions can be an
 # expensive operation depending on the authorizer, CassandraAuthorizer is
 # one example). Defaults to 2000, set to 0 to disable.
@@ -680,58 +692,6 @@ commitlog_total_space_in_mb: -1
 # Default value is 0, which never timeout streams.
 # streaming_socket_timeout_in_ms: 0

-
-# endpoint_snitch -- Set this to a class that implements
-# IEndpointSnitch.  The snitch has two functions:
-# - it teaches Scylla enough about your network topology to route
-#   requests efficiently
-# - it allows Scylla to spread replicas around your cluster to avoid
-#   correlated failures. It does this by grouping machines into
-#   "datacenters" and "racks."  Scylla will do its best not to have
-#   more than one replica on the same "rack" (which may not actually
-#   be a physical location)
-#
-# IF YOU CHANGE THE SNITCH AFTER DATA IS INSERTED INTO THE CLUSTER,
-# YOU MUST RUN A FULL REPAIR, SINCE THE SNITCH AFFECTS WHERE REPLICAS
-# ARE PLACED.
-#
-# Out of the box, Scylla provides
-#  - SimpleSnitch:
-#    Treats Strategy order as proximity. This can improve cache
-#    locality when disabling read repair.  Only appropriate for
-#    single-datacenter deployments.
-#  - GossipingPropertyFileSnitch
-#    This should be your go-to snitch for production use.  The rack
-#    and datacenter for the local node are defined in
-#    cassandra-rackdc.properties and propagated to other nodes via
-#    gossip.  If cassandra-topology.properties exists, it is used as a
-#    fallback, allowing migration from the PropertyFileSnitch.
-#  - PropertyFileSnitch:
-#    Proximity is determined by rack and data center, which are
-#    explicitly configured in cassandra-topology.properties.
-#  - Ec2Snitch:
-#    Appropriate for EC2 deployments in a single Region. Loads Region
-#    and Availability Zone information from the EC2 API. The Region is
-#    treated as the datacenter, and the Availability Zone as the rack.
-#    Only private IPs are used, so this will not work across multiple
-#    Regions.
-#  - Ec2MultiRegionSnitch:
-#    Uses public IPs as broadcast_address to allow cross-region
-#    connectivity.  (Thus, you should set seed addresses to the public
-#    IP as well.) You will need to open the storage_port or
-#    ssl_storage_port on the public IP firewall.  (For intra-Region
-#    traffic, Scylla will switch to the private IP after
-#    establishing a connection.)
-#  - RackInferringSnitch:
-#    Proximity is determined by rack and data center, which are
-#    assumed to correspond to the 3rd and 2nd octet of each node's IP
-#    address, respectively.  Unless this happens to match your
-#    deployment conventions, this is best used as an example of
-#    writing a custom Snitch class and is provided in that spirit.
-#
-# You can use a custom Snitch by setting this to the full class name
-# of the snitch, which will be assumed to be on your classpath.
-
 # controls how often to perform the more expensive part of host score
 # calculation
 # dynamic_snitch_update_interval_in_ms: 100 
@@ -824,7 +784,7 @@ commitlog_total_space_in_mb: -1
 # can be:  all  - all traffic is compressed
 #          dc   - traffic between different datacenters is compressed
 #          none - nothing is compressed.
-# internode_compression: all
+# internode_compression: none

 # Enable or disable tcp_nodelay for inter-dc communication.
 # Disabling it will result in larger (but fewer) network packets being sent,
@@ -845,3 +805,21 @@ commitlog_total_space_in_mb: -1
 # true: relaxed environment checks; performance and reliability may degraade.
 #
 # developer_mode: false
+
+
+# Idle-time background processing
+#
+# Scylla can perform certain jobs in the background while the system is otherwise idle,
+# freeing processor resources when there is other work to be done.
+#
+# defragment_memory_on_idle: true
+#
+# prometheus port
+# By default, Scylla opens the prometheus API on port 9180.
+# Setting the port to 0 disables the prometheus API.
+# prometheus_port: 9180
+#
+# prometheus address
+# By default, the prometheus API listens on all interfaces.
+# It is possible to restrict the listening address to a specific one.
+# prometheus_address: 0.0.0.0
--- a/configure.py
+++ b/configure.py
@@ -1,6 +1,6 @@
 #!/usr/bin/python3
 #
-# Copyright 2015 Cloudius Systems
+# Copyright (C) 2015 ScyllaDB
 #

 #
@@ -162,6 +162,8 @@ modes = {

 scylla_tests = [
    'tests/mutation_test',
+    'tests/streamed_mutation_test',
+    'tests/schema_registry_test',
    'tests/canonical_mutation_test',
    'tests/range_test',
    'tests/types_test',
@@ -215,6 +217,12 @@ scylla_tests = [
    'tests/dynamic_bitset_test',
    'tests/auth_test',
    'tests/idl_test',
+    'tests/range_tombstone_list_test',
+    'tests/anchorless_list_test',
+    'tests/database_test',
+    'tests/nonwrapping_range_test',
+    'tests/input_stream_test',
+    'tests/sstable_atomic_deletion_test',
 ]

 apps = [
@@ -255,6 +263,8 @@ arg_parser.add_argument('--debuginfo', action = 'store', dest = 'debuginfo', typ
                        help = 'Enable(1)/disable(0)compiler debug information generation')
 arg_parser.add_argument('--static-stdc++', dest = 'staticcxx', action = 'store_true',
 			help = 'Link libgcc and libstdc++ statically')
+arg_parser.add_argument('--static-thrift', dest = 'staticthrift', action = 'store_true',
+			help = 'Link libthrift statically')
 arg_parser.add_argument('--tests-debuginfo', action = 'store', dest = 'tests_debuginfo', type = int, default = 0,
                        help = 'Enable(1)/disable(0)compiler debug information generation for tests')
 arg_parser.add_argument('--python', action = 'store', dest = 'python', default = 'python3',
@@ -275,6 +285,8 @@ scylla_core = (['database.cc',
                 'schema_registry.cc',
                 'bytes.cc',
                 'mutation.cc',
+                 'streamed_mutation.cc',
+                 'partition_version.cc',
                 'row_cache.cc',
                 'canonical_mutation.cc',
                 'frozen_mutation.cc',
@@ -293,12 +305,12 @@ scylla_core = (['database.cc',
                 'sstables/sstables.cc',
                 'sstables/compress.cc',
                 'sstables/row.cc',
-                 'sstables/key.cc',
                 'sstables/partition.cc',
                 'sstables/filter.cc',
                 'sstables/compaction.cc',
+                 'sstables/compaction_strategy.cc',
                 'sstables/compaction_manager.cc',
-                 'log.cc',
+                 'sstables/atomic_deletion.cc',
                 'transport/event.cc',
                 'transport/event_notifier.cc',
                 'transport/server.cc',
@@ -315,11 +327,14 @@ scylla_core = (['database.cc',
                 'cql3/functions/functions.cc',
                 'cql3/statements/cf_prop_defs.cc',
                 'cql3/statements/cf_statement.cc',
+                 'cql3/statements/authentication_statement.cc',
                 'cql3/statements/create_keyspace_statement.cc',
                 'cql3/statements/create_table_statement.cc',
                 'cql3/statements/create_type_statement.cc',
+                 'cql3/statements/create_user_statement.cc',
                 'cql3/statements/drop_keyspace_statement.cc',
                 'cql3/statements/drop_table_statement.cc',
+                 'cql3/statements/drop_type_statement.cc',
                 'cql3/statements/schema_altering_statement.cc',
                 'cql3/statements/ks_prop_defs.cc',
                 'cql3/statements/modification_statement.cc',
@@ -335,8 +350,19 @@ scylla_core = (['database.cc',
                 'cql3/statements/create_index_statement.cc',
                 'cql3/statements/truncate_statement.cc',
                 'cql3/statements/alter_table_statement.cc',
+                 'cql3/statements/alter_user_statement.cc',
+                 'cql3/statements/drop_user_statement.cc',
+                 'cql3/statements/list_users_statement.cc',
+                 'cql3/statements/authorization_statement.cc',
+                 'cql3/statements/permission_altering_statement.cc',
+                 'cql3/statements/list_permissions_statement.cc',
+                 'cql3/statements/grant_statement.cc',
+                 'cql3/statements/revoke_statement.cc',
+                 'cql3/statements/alter_type_statement.cc',
+                 'cql3/statements/alter_keyspace_statement.cc',
                 'cql3/update_parameters.cc',
                 'cql3/ut_name.cc',
+                 'cql3/user_options.cc',
                 'thrift/handler.cc',
                 'thrift/server.cc',
                 'thrift/thrift_validation.cc',
@@ -352,6 +378,7 @@ scylla_core = (['database.cc',
                 'cql3/operator.cc',
                 'cql3/relation.cc',
                 'cql3/column_identifier.cc',
+                 'cql3/column_specification.cc',
                 'cql3/constants.cc',
                 'cql3/query_processor.cc',
                 'cql3/query_options.cc',
@@ -367,6 +394,7 @@ scylla_core = (['database.cc',
                 'cql3/selection/selection.cc',
                 'cql3/selection/selector.cc',
                 'cql3/restrictions/statement_restrictions.cc',
+                 'cql3/result_set.cc',
                 'db/consistency_level.cc',
                 'db/system_keyspace.cc',
                 'db/schema_tables.cc',
@@ -387,6 +415,7 @@ scylla_core = (['database.cc',
                 'utils/file_lock.cc',
                 'utils/dynamic_bitset.cc',
                 'utils/managed_bytes.cc',
+                 'utils/exceptions.cc',
                 'gms/version_generator.cc',
                 'gms/versioned_value.cc',
                 'gms/gossiper.cc',
@@ -399,6 +428,7 @@ scylla_core = (['database.cc',
                 'dht/i_partitioner.cc',
                 'dht/murmur3_partitioner.cc',
                 'dht/byte_ordered_partitioner.cc',
+                 'dht/random_partitioner.cc',
                 'dht/boot_strapper.cc',
                 'dht/range_streamer.cc',
                 'unimplemented.cc',
@@ -447,9 +477,17 @@ scylla_core = (['database.cc',
                 'auth/auth.cc',
                 'auth/authenticated_user.cc',
                 'auth/authenticator.cc',
+                 'auth/authorizer.cc',
+                 'auth/default_authorizer.cc',
                 'auth/data_resource.cc',
                 'auth/password_authenticator.cc',
                 'auth/permission.cc',
+                 'tracing/tracing.cc',
+                 'tracing/trace_keyspace_helper.cc',
+                 'tracing/trace_state.cc',
+                 'range_tombstone.cc',
+                 'range_tombstone_list.cc',
+                 'db/size_estimates_recorder.cc'
                 ]
                + [Antlr3Grammar('cql3/Cql.g')]
                + [Thrift('interface/cassandra.thrift', 'Cassandra')]
@@ -509,6 +547,7 @@ idls = ['idl/gossip_digest.idl.hh',
        'idl/query.idl.hh',
        'idl/idl_test.idl.hh',
        'idl/commitlog.idl.hh',
+        'idl/tracing.idl.hh',
        ]

 scylla_tests_dependencies = scylla_core + api + idls + [
@@ -531,8 +570,6 @@ tests_not_using_seastar_test_framework = set([
    'tests/keys_test',
    'tests/partitioner_test',
    'tests/map_difference_test',
-    'tests/frozen_mutation_test',
-    'tests/canonical_mutation_test',
    'tests/perf/perf_mutation',
    'tests/lsa_async_eviction_test',
    'tests/lsa_sync_eviction_test',
@@ -553,6 +590,9 @@ tests_not_using_seastar_test_framework = set([
    'tests/managed_vector_test',
    'tests/dynamic_bitset_test',
    'tests/idl_test',
+    'tests/range_tombstone_list_test',
+    'tests/anchorless_list_test',
+    'tests/nonwrapping_range_test',
 ])

 for t in tests_not_using_seastar_test_framework:
@@ -567,9 +607,11 @@ for t in scylla_tests:
 deps['tests/sstable_test'] += ['tests/sstable_datafile_test.cc']

 deps['tests/bytes_ostream_test'] = ['tests/bytes_ostream_test.cc']
+deps['tests/input_stream_test'] = ['tests/input_stream_test.cc']
 deps['tests/UUID_test'] = ['utils/UUID_gen.cc', 'tests/UUID_test.cc']
 deps['tests/murmur_hash_test'] = ['bytes.cc', 'utils/murmur_hash.cc', 'tests/murmur_hash_test.cc']
-deps['tests/allocation_strategy_test'] = ['tests/allocation_strategy_test.cc', 'utils/logalloc.cc', 'log.cc', 'utils/dynamic_bitset.cc']
+deps['tests/allocation_strategy_test'] = ['tests/allocation_strategy_test.cc', 'utils/logalloc.cc', 'utils/dynamic_bitset.cc']
+deps['tests/anchorless_list_test'] = ['tests/anchorless_list_test.cc']

 warnings = [
    '-Wno-mismatched-tags',  # clang-only
@@ -705,6 +747,10 @@ user_cflags = args.user_cflags
 user_ldflags = args.user_ldflags
 if args.staticcxx:
    user_ldflags += " -static-libgcc -static-libstdc++"
+if args.staticthrift:
+    thrift_libs = "-Wl,-Bstatic -lthrift -Wl,-Bdynamic"  # static for libthrift only; -Bdynamic restores dynamic linking for the libs that follow
+else:
+    thrift_libs = "-lthrift"

 outdir = 'build'
 buildfile = 'build.ninja'
@@ -815,14 +861,14 @@ with open(buildfile, 'w') as f:
                    f.write('build $builddir/{}/{}: {}.{} {} {}\n'.format(mode, binary, tests_link_rule, mode, str.join(' ', objs),
                                                                                     'seastar/build/{}/libseastar.a'.format(mode)))
                    if has_thrift:
-                        f.write('   libs =  -lthrift -lboost_system $libs\n')
+                        f.write('   libs =  {} -lboost_system $libs\n'.format(thrift_libs))
                    f.write('build $builddir/{}/{}_g: link.{} {} {}\n'.format(mode, binary, mode, str.join(' ', objs),
                                                                              'seastar/build/{}/libseastar.a'.format(mode)))
                else:
                    f.write('build $builddir/{}/{}: link.{} {} {}\n'.format(mode, binary, mode, str.join(' ', objs),
                                                                            'seastar/build/{}/libseastar.a'.format(mode)))
                if has_thrift:
-                    f.write('   libs =  -lthrift -lboost_system $libs\n')
+                    f.write('   libs =  {} -lboost_system $libs\n'.format(thrift_libs))
            for src in srcs:
                if src.endswith('.cc'):
                    obj = '$builddir/' + mode + '/' + src.replace('.cc', '.o')
@@ -845,8 +891,8 @@ with open(buildfile, 'w') as f:
        for obj in compiles:
            src = compiles[obj]
            gen_headers = list(ragels.keys())
-            gen_headers += ['seastar/build/{}/http/request_parser.hh'.format(mode)]
-            gen_headers += ['seastar/build/{}/http/http_response_parser.hh'.format(mode)]
+            gen_headers += ['seastar/build/{}/gen/http/request_parser.hh'.format(mode)]
+            gen_headers += ['seastar/build/{}/gen/http/http_response_parser.hh'.format(mode)]
            for th in thrifts:
                gen_headers += th.headers('$builddir/{}/gen'.format(mode))
            for g in antlr3_grammars:
@@ -878,10 +924,10 @@ with open(buildfile, 'w') as f:
            for cc in grammar.sources('$builddir/{}/gen'.format(mode)):
                obj = cc.replace('.cpp', '.o')
                f.write('build {}: cxx.{} {} || {}\n'.format(obj, mode, cc, ' '.join(serializers)))
-        f.write('build seastar/build/{mode}/libseastar.a seastar/build/{mode}/apps/iotune/iotune: ninja {seastar_deps}\n'
+        f.write('build seastar/build/{mode}/libseastar.a seastar/build/{mode}/apps/iotune/iotune seastar/build/{mode}/gen/http/request_parser.hh seastar/build/{mode}/gen/http/http_response_parser.hh: ninja {seastar_deps}\n'
                .format(**locals()))
        f.write('  subdir = seastar\n')
-        f.write('  target = build/{mode}/libseastar.a build/{mode}/apps/iotune/iotune\n'.format(**locals()))
+        f.write('  target = build/{mode}/libseastar.a build/{mode}/apps/iotune/iotune build/{mode}/gen/http/request_parser.hh build/{mode}/gen/http/http_response_parser.hh\n'.format(**locals()))
        f.write(textwrap.dedent('''\
            build build/{mode}/iotune: copy seastar/build/{mode}/apps/iotune/iotune
            ''').format(**locals()))
@@ -895,14 +941,6 @@ with open(buildfile, 'w') as f:
            command = find -name '*.[chS]' -o -name "*.cc" -o -name "*.hh" | cscope -bq -i-
            description = CSCOPE
        build cscope: cscope
-        rule request_parser_hh
-           command = {ninja} -C seastar build/release/gen/http/request_parser.hh build/debug/gen/http/request_parser.hh
-           description = GEN seastar/http/request_parser.hh
-        build seastar/build/release/http/request_parser.hh seastar/build/debug/http/request_parser.hh: request_parser_hh
-        rule http_response_parser_hh
-           command = {ninja} -C seastar build/release/gen/http/http_response_parser.hh build/debug/gen/http/http_response_parser.hh
-           description = GEN seastar/http/http_response_parser.hh
-        build seastar/build/release/http/http_response_parser.hh seastar/build/debug/http/http_response_parser.hh: http_response_parser_hh
        rule clean
            command = rm -rf build
            description = CLEAN
--- a/converting_mutation_partition_applier.hh
+++ b/converting_mutation_partition_applier.hh
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 2015 Cloudius Systems, Ltd.
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
@@ -35,7 +35,7 @@ class converting_mutation_partition_applier : public mutation_partition_visitor
    deletable_row* _current_row;
 private:
    static bool is_compatible(const column_definition& new_def, const data_type& old_type, column_kind kind) {
-        return new_def.kind == kind && new_def.type->is_value_compatible_with(*old_type);
+        return ::is_compatible(new_def.kind, kind) && new_def.type->is_value_compatible_with(*old_type);
    }
    void accept_cell(row& dst, column_kind kind, const column_definition& new_def, const data_type& old_type, atomic_cell_view cell) {
        if (is_compatible(new_def, old_type, kind) && cell.timestamp() > new_def.dropped_at()) {
@@ -90,8 +90,8 @@ public:
        }
    }

-    virtual void accept_row_tombstone(clustering_key_prefix_view prefix, tombstone t) override {
-        _p.apply_row_tombstone(_p_schema, prefix, t);
+    virtual void accept_row_tombstone(const range_tombstone& rt) override {
+        _p.apply_row_tombstone(_p_schema, rt);
    }

    virtual void accept_row(clustering_key_view key, tombstone deleted_at, const row_marker& rm) override {
--- a/cql3/Cql.g
+++ b/cql3/Cql.g
@@ -26,26 +26,39 @@ options {
@parser::namespace{cql3_parser}

@lexer::includes {
+#include "cql3/error_collector.hh"
 #include "cql3/error_listener.hh"
 }

@parser::includes {
 #include "cql3/selection/writetime_or_ttl.hh"
+#include "cql3/statements/raw/parsed_statement.hh"
+#include "cql3/statements/raw/select_statement.hh"
+#include "cql3/statements/alter_keyspace_statement.hh"
 #include "cql3/statements/alter_table_statement.hh"
 #include "cql3/statements/create_keyspace_statement.hh"
 #include "cql3/statements/drop_keyspace_statement.hh"
 #include "cql3/statements/create_index_statement.hh"
 #include "cql3/statements/create_table_statement.hh"
 #include "cql3/statements/create_type_statement.hh"
+#include "cql3/statements/drop_type_statement.hh"
+#include "cql3/statements/alter_type_statement.hh"
 #include "cql3/statements/property_definitions.hh"
 #include "cql3/statements/drop_table_statement.hh"
 #include "cql3/statements/truncate_statement.hh"
-#include "cql3/statements/select_statement.hh"
-#include "cql3/statements/update_statement.hh"
-#include "cql3/statements/delete_statement.hh"
+#include "cql3/statements/raw/update_statement.hh"
+#include "cql3/statements/raw/insert_statement.hh"
+#include "cql3/statements/raw/delete_statement.hh"
 #include "cql3/statements/index_prop_defs.hh"
-#include "cql3/statements/use_statement.hh"
-#include "cql3/statements/batch_statement.hh"
+#include "cql3/statements/raw/use_statement.hh"
+#include "cql3/statements/raw/batch_statement.hh"
+#include "cql3/statements/create_user_statement.hh"
+#include "cql3/statements/alter_user_statement.hh"
+#include "cql3/statements/drop_user_statement.hh"
+#include "cql3/statements/list_users_statement.hh"
+#include "cql3/statements/grant_statement.hh"
+#include "cql3/statements/revoke_statement.hh"
+#include "cql3/statements/list_permissions_statement.hh"
 #include "cql3/statements/index_target.hh"
 #include "cql3/statements/ks_prop_defs.hh"
 #include "cql3/selection/raw_selector.hh"
@@ -108,10 +121,13 @@ struct uninitialized {
 }

@context {
-    using listener_type = cql3::error_listener<RecognizerType>;
+    using collector_type = cql3::error_collector<ComponentType, ExceptionBaseType::TokenType, ExceptionBaseType>;
+    using listener_type = cql3::error_listener<ComponentType, ExceptionBaseType>;
+
    listener_type* listener;

    std::vector<::shared_ptr<cql3::column_identifier>> _bind_variables;
+    std::vector<std::unique_ptr<TokenType>> _missing_tokens;

    // Can't use static variable, since it needs to be defined out-of-line
    static const std::unordered_set<sstring>& _reserved_type_names() {
@@ -161,15 +177,26 @@ struct uninitialized {

    void displayRecognitionError(ANTLR_UINT8** token_names, ExceptionBaseType* ex)
    {
-        std::stringstream msg;
-        ex->displayRecognitionError(token_names, msg);
-        listener->syntax_error(*this, msg.str());
+        listener->syntax_error(*this, token_names, ex);
    }

    void add_recognition_error(const sstring& msg) {
        listener->syntax_error(*this, msg);
    }

+    bool is_eof_token(CommonTokenType token) const
+    {
+        return token == CommonTokenType::TOKEN_EOF;
+    }
+
+    std::string token_text(const TokenType* token)
+    {
+        if (!token) {
+            return "";
+        }
+        return token->getText();
+    }
+
    std::map<sstring, sstring> convert_property_map(shared_ptr<cql3::maps::literal> map) {
        if (!map || map->entries.empty()) {
            return std::map<sstring, sstring>{};
@@ -216,6 +243,13 @@ struct uninitialized {
        }
        operations.emplace_back(std::move(key), std::move(update));
    }
+
+    TokenType* getMissingSymbol(IntStreamType* istream, ExceptionBaseType* e,
+                                ANTLR_UINT32 expectedTokenType, BitsetListType* follow) {
+        auto token = BaseType::getMissingSymbol(istream, e, expectedTokenType, follow);
+        _missing_tokens.emplace_back(token);
+        return token;
+    }
 }

@lexer::namespace{cql3_parser}
@@ -233,7 +267,8 @@ struct uninitialized {
 }

@lexer::context {
-    using listener_type = cql3::error_listener<RecognizerType>;
+    using collector_type = cql3::error_collector<ComponentType, ExceptionBaseType::TokenType, ExceptionBaseType>;
+    using listener_type = cql3::error_listener<ComponentType, ExceptionBaseType>;

    listener_type* listener;

@@ -243,19 +278,30 @@ struct uninitialized {

    void displayRecognitionError(ANTLR_UINT8** token_names, ExceptionBaseType* ex)
    {
-        std::stringstream msg;
-        ex->displayRecognitionError(token_names, msg);
-        listener->syntax_error(*this, msg.str());
+        listener->syntax_error(*this, token_names, ex);
+    }
+
+    bool is_eof_token(CommonTokenType token) const
+    {
+        return token == CommonTokenType::TOKEN_EOF;
+    }
+
+    std::string token_text(const TokenType* token) const
+    {
+        if (!token) {
+            return "";
+        }
+        return std::to_string(int(*token));
    }
 }

 /** STATEMENTS **/

-query returns [shared_ptr<parsed_statement> stmnt]
+query returns [shared_ptr<raw::parsed_statement> stmnt]
    : st=cqlStatement (';')* EOF { $stmnt = st; }
    ;

-cqlStatement returns [shared_ptr<parsed_statement> stmt]
+cqlStatement returns [shared_ptr<raw::parsed_statement> stmt]
    @after{ if (stmt) { stmt->set_bound_variables(_bind_variables); } }
    : st1= selectStatement             { $stmt = st1; }
    | st2= insertStatement             { $stmt = st2; }
@@ -273,7 +319,6 @@ cqlStatement returns [shared_ptr<parsed_statement> stmt]
    | st13=dropIndexStatement          { $stmt = st13; }
 #endif
    | st14=alterTableStatement         { $stmt = st14; }
-#if 0
    | st15=alterKeyspaceStatement      { $stmt = st15; }
    | st16=grantStatement              { $stmt = st16; }
    | st17=revokeStatement             { $stmt = st17; }
@@ -282,13 +327,14 @@ cqlStatement returns [shared_ptr<parsed_statement> stmt]
    | st20=alterUserStatement          { $stmt = st20; }
    | st21=dropUserStatement           { $stmt = st21; }
    | st22=listUsersStatement          { $stmt = st22; }
+#if 0
    | st23=createTriggerStatement      { $stmt = st23; }
    | st24=dropTriggerStatement        { $stmt = st24; }
 #endif
    | st25=createTypeStatement         { $stmt = st25; }
-#if 0
    | st26=alterTypeStatement          { $stmt = st26; }
    | st27=dropTypeStatement           { $stmt = st27; }
+#if 0
    | st28=createFunctionStatement     { $stmt = st28; }
    | st29=dropFunctionStatement       { $stmt = st29; }
    | st30=createAggregateStatement    { $stmt = st30; }
@@ -299,8 +345,8 @@ cqlStatement returns [shared_ptr<parsed_statement> stmt]
 /*
 * USE <KEYSPACE>;
 */
-useStatement returns [::shared_ptr<use_statement> stmt]
-    : K_USE ks=keyspaceName { $stmt = ::make_shared<use_statement>(ks); }
+useStatement returns [::shared_ptr<raw::use_statement> stmt]
+    : K_USE ks=keyspaceName { $stmt = ::make_shared<raw::use_statement>(ks); }
    ;

 /**
@@ -309,11 +355,11 @@ useStatement returns [::shared_ptr<use_statement> stmt]
 * WHERE KEY = "key1" AND COL > 1 AND COL < 100
 * LIMIT <NUMBER>;
 */
-selectStatement returns [shared_ptr<select_statement::raw_statement> expr]
+selectStatement returns [shared_ptr<raw::select_statement> expr]
    @init {
        bool is_distinct = false;
        ::shared_ptr<cql3::term::raw> limit;
-        select_statement::parameters::orderings_type orderings;
+        raw::select_statement::parameters::orderings_type orderings;
        bool allow_filtering = false;
    }
    : K_SELECT ( ( K_DISTINCT { is_distinct = true; } )?
@@ -326,8 +372,8 @@ selectStatement returns [shared_ptr<select_statement::raw_statement> expr]
      ( K_LIMIT rows=intValue { limit = rows; } )?
      ( K_ALLOW K_FILTERING  { allow_filtering = true; } )?
      {
-          auto params = ::make_shared<select_statement::parameters>(std::move(orderings), is_distinct, allow_filtering);
-          $expr = ::make_shared<select_statement::raw_statement>(std::move(cf), std::move(params),
+          auto params = ::make_shared<raw::select_statement::parameters>(std::move(orderings), is_distinct, allow_filtering);
+          $expr = ::make_shared<raw::select_statement>(std::move(cf), std::move(params),
            std::move(sclause), std::move(wclause), std::move(limit));
      }
    ;
@@ -381,7 +427,7 @@ whereClause returns [std::vector<cql3::relation_ptr> clause]
    : relation[$clause] (K_AND relation[$clause])*
    ;

-orderByClause[select_statement::parameters::orderings_type& orderings]
+orderByClause[raw::select_statement::parameters::orderings_type& orderings]
    @init{
        bool reversed = false;
    }
@@ -394,7 +440,7 @@ orderByClause[select_statement::parameters::orderings_type& orderings]
 * USING TIMESTAMP <long>;
 *
 */
-insertStatement returns [::shared_ptr<update_statement::parsed_insert> expr]
+insertStatement returns [::shared_ptr<raw::insert_statement> expr]
    @init {
        auto attrs = ::make_shared<cql3::attributes::raw>();
        std::vector<::shared_ptr<cql3::column_identifier::raw>> column_names;
@@ -409,7 +455,7 @@ insertStatement returns [::shared_ptr<update_statement::parsed_insert> expr]
        ( K_IF K_NOT K_EXISTS { if_not_exists = true; } )?
        ( usingClause[attrs] )?
      {
-          $expr = ::make_shared<update_statement::parsed_insert>(std::move(cf),
+          $expr = ::make_shared<raw::insert_statement>(std::move(cf),
                                                   std::move(attrs),
                                                   std::move(column_names),
                                                   std::move(values),
@@ -432,7 +478,7 @@ usingClauseObjective[::shared_ptr<cql3::attributes::raw> attrs]
 * SET name1 = value1, name2 = value2
 * WHERE key = value;
 */
-updateStatement returns [::shared_ptr<update_statement::parsed_update> expr]
+updateStatement returns [::shared_ptr<raw::update_statement> expr]
    @init {
        auto attrs = ::make_shared<cql3::attributes::raw>();
        std::vector<std::pair<::shared_ptr<cql3::column_identifier::raw>, ::shared_ptr<cql3::operation::raw_update>>> operations;
@@ -443,7 +489,7 @@ updateStatement returns [::shared_ptr<update_statement::parsed_update> expr]
      K_WHERE wclause=whereClause
      ( K_IF conditions=updateConditions )?
      {
-          return ::make_shared<update_statement::parsed_update>(std::move(cf),
+          return ::make_shared<raw::update_statement>(std::move(cf),
                                                  std::move(attrs),
                                                  std::move(operations),
                                                  std::move(wclause),
@@ -462,7 +508,7 @@ updateConditions returns [conditions_type conditions]
 * WHERE KEY = keyname
   [IF (EXISTS | name = value, ...)];
 */
-deleteStatement returns [::shared_ptr<delete_statement::parsed> expr]
+deleteStatement returns [::shared_ptr<raw::delete_statement> expr]
    @init {
        auto attrs = ::make_shared<cql3::attributes::raw>();
        std::vector<::shared_ptr<cql3::operation::raw_deletion>> column_deletions;
@@ -474,7 +520,7 @@ deleteStatement returns [::shared_ptr<delete_statement::parsed> expr]
      K_WHERE wclause=whereClause
      ( K_IF ( K_EXISTS { if_exists = true; } | conditions=updateConditions ))?
      {
-          return ::make_shared<delete_statement::parsed>(cf,
+          return ::make_shared<raw::delete_statement>(cf,
                                            std::move(attrs),
                                            std::move(column_deletions),
                                            std::move(wclause),
@@ -521,11 +567,11 @@ usingClauseDelete[::shared_ptr<cql3::attributes::raw> attrs]
 *   ...
 * APPLY BATCH
 */
-batchStatement returns [shared_ptr<cql3::statements::batch_statement::parsed> expr]
+batchStatement returns [shared_ptr<cql3::statements::raw::batch_statement> expr]
    @init {
-        using btype = cql3::statements::batch_statement::type; 
+        using btype = cql3::statements::raw::batch_statement::type; 
        btype type = btype::LOGGED;
-        std::vector<shared_ptr<cql3::statements::modification_statement::parsed>> statements;
+        std::vector<shared_ptr<cql3::statements::raw::modification_statement>> statements;
        auto attrs = make_shared<cql3::attributes::raw>();
    }
    : K_BEGIN
@@ -534,11 +580,11 @@ batchStatement returns [shared_ptr<cql3::statements::batch_statement::parsed> ex
          ( s=batchStatementObjective ';'? { statements.push_back(std::move(s)); } )*
      K_APPLY K_BATCH
      {
-          $expr = ::make_shared<cql3::statements::batch_statement::parsed>(type, std::move(attrs), std::move(statements));
+          $expr = ::make_shared<cql3::statements::raw::batch_statement>(type, std::move(attrs), std::move(statements));
      }
    ;

-batchStatementObjective returns [shared_ptr<cql3::statements::modification_statement::parsed> statement]
+batchStatementObjective returns [shared_ptr<cql3::statements::raw::modification_statement> statement]
    : i=insertStatement  { $statement = i; }
    | u=updateStatement  { $statement = u; }
    | d=deleteStatement  { $statement = d; }
@@ -764,15 +810,18 @@ dropTriggerStatement returns [DropTriggerStatement expr]
      { $expr = new DropTriggerStatement(cf, name.toString(), ifExists); }
    ;

+#endif
+
 /**
 * ALTER KEYSPACE <KS> WITH <property> = <value>;
 */
-alterKeyspaceStatement returns [AlterKeyspaceStatement expr]
-    @init { KSPropDefs attrs = new KSPropDefs(); }
+alterKeyspaceStatement returns [shared_ptr<cql3::statements::alter_keyspace_statement> expr]
+    @init {
+        auto attrs = make_shared<cql3::statements::ks_prop_defs>();
+    }
    : K_ALTER K_KEYSPACE ks=keyspaceName
-        K_WITH properties[attrs] { $expr = new AlterKeyspaceStatement(ks, attrs); }
+        K_WITH properties[attrs] { $expr = make_shared<cql3::statements::alter_keyspace_statement>(ks, attrs); }
    ;
-#endif

 /**
 * ALTER COLUMN FAMILY <CF> ALTER <column> TYPE <newtype>;
@@ -803,26 +852,27 @@ alterTableStatement returns [shared_ptr<alter_table_statement> expr]
    }
    ;

-#if 0
 /**
 * ALTER TYPE <name> ALTER <field> TYPE <newtype>;
 * ALTER TYPE <name> ADD <field> <newtype>;
 * ALTER TYPE <name> RENAME <field> TO <newtype> AND ...;
 */
-alterTypeStatement returns [AlterTypeStatement expr]
+alterTypeStatement returns [::shared_ptr<alter_type_statement> expr]
    : K_ALTER K_TYPE name=userTypeName
-          ( K_ALTER f=ident K_TYPE v=comparatorType { $expr = AlterTypeStatement.alter(name, f, v); }
-          | K_ADD   f=ident v=comparatorType        { $expr = AlterTypeStatement.addition(name, f, v); }
+          ( K_ALTER f=ident K_TYPE v=comparatorType { $expr = ::make_shared<alter_type_statement::add_or_alter>(name, false, f, v); }
+          | K_ADD   f=ident v=comparatorType        { $expr = ::make_shared<alter_type_statement::add_or_alter>(name, true, f, v); }
          | K_RENAME
-               { Map<ColumnIdentifier, ColumnIdentifier> renames = new HashMap<ColumnIdentifier, ColumnIdentifier>(); }
-                 id1=ident K_TO toId1=ident { renames.put(id1, toId1); }
-                 ( K_AND idn=ident K_TO toIdn=ident { renames.put(idn, toIdn); } )*
-               { $expr = AlterTypeStatement.renames(name, renames); }
+               { $expr = ::make_shared<alter_type_statement::renames>(name); }
+               renames[{ static_pointer_cast<alter_type_statement::renames>($expr) }]
          )
    ;
-#endif


+renames[::shared_ptr<alter_type_statement::renames> expr]
+    : fromId=ident K_TO toId=ident { $expr->add_rename(fromId, toId); }
+      ( K_AND renames[$expr] )?
+    ;
+
 /**
 * DROP KEYSPACE [IF EXISTS] <KSP>;
 */
@@ -839,15 +889,15 @@ dropTableStatement returns [::shared_ptr<drop_table_statement> stmt]
    : K_DROP K_COLUMNFAMILY (K_IF K_EXISTS { if_exists = true; } )? cf=columnFamilyName { $stmt = ::make_shared<drop_table_statement>(cf, if_exists); }
    ;

-#if 0
 /**
 * DROP TYPE <name>;
 */
-dropTypeStatement returns [DropTypeStatement stmt]
-    @init { boolean ifExists = false; }
-    : K_DROP K_TYPE (K_IF K_EXISTS { ifExists = true; } )? name=userTypeName { $stmt = new DropTypeStatement(name, ifExists); }
+dropTypeStatement returns [::shared_ptr<drop_type_statement> stmt]
+    @init { bool if_exists = false; }
+    : K_DROP K_TYPE (K_IF K_EXISTS { if_exists = true; } )? name=userTypeName { $stmt = ::make_shared<drop_type_statement>(name, if_exists); }
    ;

+#if 0
 /**
 * DROP INDEX [IF EXISTS] <INDEX_NAME>
 */
@@ -865,120 +915,118 @@ truncateStatement returns [::shared_ptr<truncate_statement> stmt]
    : K_TRUNCATE (K_COLUMNFAMILY)? cf=columnFamilyName { $stmt = ::make_shared<truncate_statement>(cf); }
    ;

-#if 0
 /**
 * GRANT <permission> ON <resource> TO <username>
 */
-grantStatement returns [GrantStatement stmt]
+grantStatement returns [::shared_ptr<grant_statement> stmt]
    : K_GRANT
          permissionOrAll
      K_ON
          resource
      K_TO
          username
-      { $stmt = new GrantStatement($permissionOrAll.perms, $resource.res, $username.text); }
+      { $stmt = ::make_shared<grant_statement>($permissionOrAll.perms, $resource.res, $username.text); } 
    ;

 /**
 * REVOKE <permission> ON <resource> FROM <username>
 */
-revokeStatement returns [RevokeStatement stmt]
+revokeStatement returns [::shared_ptr<revoke_statement> stmt]
    : K_REVOKE
          permissionOrAll
      K_ON
          resource
      K_FROM
          username
-      { $stmt = new RevokeStatement($permissionOrAll.perms, $resource.res, $username.text); }
+      { $stmt = ::make_shared<revoke_statement>($permissionOrAll.perms, $resource.res, $username.text); } 
    ;

-listPermissionsStatement returns [ListPermissionsStatement stmt]
+listPermissionsStatement returns [::shared_ptr<list_permissions_statement> stmt]
    @init {
-        IResource resource = null;
-        String username = null;
-        boolean recursive = true;
+		std::experimental::optional<auth::data_resource> r;
+		std::experimental::optional<sstring> u;
+		bool recursive = true;
    }
    : K_LIST
          permissionOrAll
-      ( K_ON resource { resource = $resource.res; } )?
-      ( K_OF username { username = $username.text; } )?
+      ( K_ON resource { r = $resource.res; } )?
+      ( K_OF username { u = sstring($username.text); } )?
      ( K_NORECURSIVE { recursive = false; } )?
-      { $stmt = new ListPermissionsStatement($permissionOrAll.perms, resource, username, recursive); }
+      { $stmt = ::make_shared<list_permissions_statement>($permissionOrAll.perms, std::move(r), std::move(u), recursive); } 
    ;

-permission returns [Permission perm]
+permission returns [auth::permission perm]
    : p=(K_CREATE | K_ALTER | K_DROP | K_SELECT | K_MODIFY | K_AUTHORIZE)
-    { $perm = Permission.valueOf($p.text.toUpperCase()); }
+    { $perm = auth::permissions::from_string($p.text); }
    ;

-permissionOrAll returns [Set<Permission> perms]
-    : K_ALL ( K_PERMISSIONS )?       { $perms = Permission.ALL_DATA; }
-    | p=permission ( K_PERMISSION )? { $perms = EnumSet.of($p.perm); }
+permissionOrAll returns [auth::permission_set perms]
+    : K_ALL ( K_PERMISSIONS )?       { $perms = auth::permissions::ALL_DATA; }
+    | p=permission ( K_PERMISSION )? { $perms = auth::permission_set::from_mask(auth::permission_set::mask_for($p.perm)); }
    ;

-resource returns [IResource res]
+resource returns [auth::data_resource res]
    : r=dataResource { $res = $r.res; }
    ;

-dataResource returns [DataResource res]
-    : K_ALL K_KEYSPACES { $res = DataResource.root(); }
-    | K_KEYSPACE ks = keyspaceName { $res = DataResource.keyspace($ks.id); }
+dataResource returns [auth::data_resource res]
+    : K_ALL K_KEYSPACES { $res = auth::data_resource(); }
+    | K_KEYSPACE ks = keyspaceName { $res = auth::data_resource($ks.id); }
    | ( K_COLUMNFAMILY )? cf = columnFamilyName
-      { $res = DataResource.columnFamily($cf.name.getKeyspace(), $cf.name.getColumnFamily()); }
+      { $res = auth::data_resource($cf.name->get_keyspace(), $cf.name->get_column_family()); }
    ;

 /**
 * CREATE USER [IF NOT EXISTS] <username> [WITH PASSWORD <password>] [SUPERUSER|NOSUPERUSER]
 */
-createUserStatement returns [CreateUserStatement stmt]
+createUserStatement returns [::shared_ptr<create_user_statement> stmt]
    @init {
-        UserOptions opts = new UserOptions();
-        boolean superuser = false;
-        boolean ifNotExists = false;
+    	auto opts = ::make_shared<cql3::user_options>();
+        bool superuser = false;
+        bool ifNotExists = false;
    }
    : K_CREATE K_USER (K_IF K_NOT K_EXISTS { ifNotExists = true; })? username
      ( K_WITH userOptions[opts] )?
      ( K_SUPERUSER { superuser = true; } | K_NOSUPERUSER { superuser = false; } )?
-      { $stmt = new CreateUserStatement($username.text, opts, superuser, ifNotExists); }
+      { $stmt = ::make_shared<create_user_statement>($username.text, std::move(opts), superuser, ifNotExists); }
    ;

 /**
 * ALTER USER <username> [WITH PASSWORD <password>] [SUPERUSER|NOSUPERUSER]
 */
-alterUserStatement returns [AlterUserStatement stmt]
+alterUserStatement returns [::shared_ptr<alter_user_statement> stmt]
    @init {
-        UserOptions opts = new UserOptions();
-        Boolean superuser = null;
+    	auto opts = ::make_shared<cql3::user_options>();
+    	std::experimental::optional<bool> superuser;
    }
    : K_ALTER K_USER username
      ( K_WITH userOptions[opts] )?
      ( K_SUPERUSER { superuser = true; } | K_NOSUPERUSER { superuser = false; } )?
-      { $stmt = new AlterUserStatement($username.text, opts, superuser); }
+      { $stmt = ::make_shared<alter_user_statement>($username.text, std::move(opts), std::move(superuser)); }
    ;

 /**
 * DROP USER [IF EXISTS] <username>
 */
-dropUserStatement returns [DropUserStatement stmt]
-    @init { boolean ifExists = false; }
-    : K_DROP K_USER (K_IF K_EXISTS { ifExists = true; })? username { $stmt = new DropUserStatement($username.text, ifExists); }
+dropUserStatement returns [::shared_ptr<drop_user_statement> stmt]
+    @init { bool ifExists = false; }
+    : K_DROP K_USER (K_IF K_EXISTS { ifExists = true; })? username { $stmt = ::make_shared<drop_user_statement>($username.text, ifExists); }
    ;

 /**
 * LIST USERS
 */
-listUsersStatement returns [ListUsersStatement stmt]
-    : K_LIST K_USERS { $stmt = new ListUsersStatement(); }
+listUsersStatement returns [::shared_ptr<list_users_statement> stmt]
+    : K_LIST K_USERS { $stmt = ::make_shared<list_users_statement>(); }
    ;

-userOptions[UserOptions opts]
+userOptions[::shared_ptr<cql3::user_options> opts]
    : userOption[opts]
    ;

-userOption[UserOptions opts]
-    : k=K_PASSWORD v=STRING_LITERAL { opts.put($k.text, $v.text); }
+userOption[::shared_ptr<cql3::user_options> opts]
+    : k=K_PASSWORD v=STRING_LITERAL { opts->put($k.text, $v.text); }
    ;
-#endif

 /** DEFINITIONS **/

@@ -1157,7 +1205,8 @@ columnOperation[operations_type& operations]

 columnOperationDifferentiator[operations_type& operations, ::shared_ptr<cql3::column_identifier::raw> key]
    : '=' normalColumnOperation[operations, key]
-    | '[' k=term ']' specializedColumnOperation[operations, key, k]
+    | '[' k=term ']' specializedColumnOperation[operations, key, k, false]
+    | '[' K_SCYLLA_TIMEUUID_LIST_INDEX '(' k=term ')' ']' specializedColumnOperation[operations, key, k, true]
    ;

 normalColumnOperation[operations_type& operations, ::shared_ptr<cql3::column_identifier::raw> key]
@@ -1199,11 +1248,12 @@ normalColumnOperation[operations_type& operations, ::shared_ptr<cql3::column_ide
 specializedColumnOperation[std::vector<std::pair<shared_ptr<cql3::column_identifier::raw>,
                                                 shared_ptr<cql3::operation::raw_update>>>& operations,
                           shared_ptr<cql3::column_identifier::raw> key,
-                           shared_ptr<cql3::term::raw> k]
+                           shared_ptr<cql3::term::raw> k,
+                           bool by_uuid]

    : '=' t=term
      {
-          add_raw_update(operations, key, make_shared<cql3::operation::set_element>(k, t));
+          add_raw_update(operations, key, make_shared<cql3::operation::set_element>(k, t, by_uuid));
      }
    ;

@@ -1383,12 +1433,10 @@ tuple_type returns [shared_ptr<cql3::cql3_type::raw> t]
      '>' { $t = cql3::cql3_type::raw::tuple(std::move(types)); }
    ;

-#if 0
 username
    : IDENT
    | STRING_LITERAL
    ;
-#endif

 // Basically the same as cident, but we need to exlude existing CQL3 types
 // (which for some reason are not reserved otherwise)
@@ -1567,6 +1615,8 @@ K_OR:          O R;
 K_REPLACE:     R E P L A C E;
 K_DETERMINISTIC: D E T E R M I N I S T I C;

+K_SCYLLA_TIMEUUID_LIST_INDEX: S C Y L L A '_' T I M E U U I D '_' L I S T '_' I N D E X;
+
 // Case-insensitive alpha characters
 fragment A: ('a'|'A');
 fragment B: ('b'|'B');
@@ -1612,20 +1662,17 @@ STRING_LITERAL
        setText(txt);
    }
    :
-// FIXME:
-#if 0
      /* pg-style string literal */
      (
-        '\$' '\$'
-        ( /* collect all input until '$$' is reached again */
-          {  (input.size() - input.index() > 1)
-               && !"$$".equals(input.substring(input.index(), input.index() + 1)) }?
-             => c=. { txt.appendCodePoint(c); }
+        '$' '$'
+        (
+          (c=~('$') { txt.push_back(c); })
+          |
+          ('$' (c=~('$') { txt.push_back('$'); txt.push_back(c); }))
        )*
-        '\$' '\$'
+        '$' '$'
      )
      |
-#endif
      /* conventional quoted string literal */
      (
        '\'' (c=~('\'') { txt.push_back(c);} | '\'' '\'' { txt.push_back('\''); })* '\''
--- a/cql3/abstract_marker.cc
+++ b/cql3/abstract_marker.cc
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
--- a/cql3/abstract_marker.hh
+++ b/cql3/abstract_marker.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
--- a/cql3/assignment_testable.hh
+++ b/cql3/assignment_testable.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2014 Cloudius Systems
+ * Copyright (C) 2014 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
--- a/cql3/attributes.cc
+++ b/cql3/attributes.cc
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
--- a/cql3/attributes.hh
+++ b/cql3/attributes.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
--- a/cql3/cf_name.cc
+++ b/cql3/cf_name.cc
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
--- a/cql3/cf_name.hh
+++ b/cql3/cf_name.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
--- a/cql3/column_condition.cc
+++ b/cql3/column_condition.cc
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
--- a/cql3/column_condition.hh
+++ b/cql3/column_condition.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
--- a/cql3/column_identifier.cc
+++ b/cql3/column_identifier.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/cql3/column_identifier.hh
+++ b/cql3/column_identifier.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
--- a/cql3/column_specification.cc
+++ b/cql3/column_specification.cc
@@ -0,0 +1,56 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/*
+ * Copyright (C) 2016 ScyllaDB
+ *
+ * Modified by ScyllaDB
+ */
+
+/*
+ * This file is part of Scylla.
+ *
+ * Scylla is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU Affero General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * Scylla is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with Scylla.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#include "cql3/column_specification.hh"
+
+namespace cql3 {
+
+bool column_specification::all_in_same_table(const std::vector<::shared_ptr<column_specification>>& names)
+{
+    // True iff every entry has the same ks_name and cf_name as the first entry; `names` must not be empty.
+    assert(!names.empty());
+    const auto& first = names.front(); // borrowed: the lambda runs synchronously, so no shared_ptr copy is needed
+    return std::all_of(std::next(names.begin()), names.end(), [&first] (const auto& spec) {
+        return spec->ks_name == first->ks_name && spec->cf_name == first->cf_name;
+    });
+}
+
+}
--- a/cql3/column_specification.hh
+++ b/cql3/column_specification.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -75,6 +75,8 @@ public:
    bool is_reversed_type() const {
        return ::dynamic_pointer_cast<const reversed_type_impl>(type) != nullptr;
    }
+    // True iff all of `names` share the ks_name and cf_name of the first entry; `names` must be non-empty.
+    static bool all_in_same_table(const std::vector<::shared_ptr<column_specification>>& names);
 };

 }
--- a/cql3/constants.cc
+++ b/cql3/constants.cc
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
--- a/cql3/constants.hh
+++ b/cql3/constants.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
--- a/cql3/cql3_type.cc
+++ b/cql3/cql3_type.cc
@@ -1,5 +1,5 @@
 /*
- * Copyright (C) 2014 Cloudius Systems, Ltd.
+ * Copyright (C) 2014 ScyllaDB
 */

 /*
@@ -148,7 +148,7 @@ public:
        try {
            auto&& ks = db.find_keyspace(_name.get_keyspace());
            try {
-                auto&& type = ks._user_types.get_type(_name.get_user_type_name());
+                auto&& type = ks.metadata()->user_types()->get_type(_name.get_user_type_name());
                if (!_frozen) {
                    throw exceptions::invalid_request_exception("Non-frozen User-Defined types are not supported, please use frozen<>");
                }
--- a/cql3/cql3_type.hh
+++ b/cql3/cql3_type.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 *
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 */

 /*
--- a/cql3/cql_statement.hh
+++ b/cql3/cql_statement.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2014 Cloudius Systems
+ * Copyright (C) 2014 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -58,6 +58,9 @@ class result_message;

 namespace cql3 {

+class metadata;
+shared_ptr<const metadata> make_empty_metadata();
+
 class cql_statement {
 public:
    virtual ~cql_statement()
@@ -70,7 +73,7 @@ public:
     *
     * @param state the current client state
     */
-    virtual void check_access(const service::client_state& state) = 0;
+    virtual future<> check_access(const service::client_state& state) = 0;

    /**
     * Perform additional validation required by the statment.
@@ -102,6 +105,15 @@ public:
    virtual bool depends_on_keyspace(const sstring& ks_name) const = 0;

    virtual bool depends_on_column_family(const sstring& cf_name) const = 0;
+
+    virtual shared_ptr<const metadata> get_result_metadata() const = 0;
+};
+
+class cql_statement_no_metadata : public cql_statement { // supplies get_result_metadata() for derived statements
+public:
+    shared_ptr<const metadata> get_result_metadata() const override { // `override` already implies virtual
+        return make_empty_metadata();
+    }
 };

 }
--- a/cql3/error_collector.hh
+++ b/cql3/error_collector.hh
@@ -17,9 +17,9 @@
 */

 /*
- * Copyright 2015 Cloudius Systems
+ * Copyright (C) 2015 ScyllaDB
 *
- * Modified by Cloudius Systems
+ * Modified by ScyllaDB
 */

 /*
@@ -50,8 +50,8 @@ namespace cql3 {
 /**
 * <code>ErrorListener</code> that collect and enhance the errors send by the CQL lexer and parser.
 */
-template<typename Recognizer>
-class error_collector : public error_listener<Recognizer> {
+template<typename RecognizerType, typename TokenType, typename ExceptionBaseType>
+class error_collector : public error_listener<RecognizerType, ExceptionBaseType> {
    /**
     * The offset of the first token of the snippet.
     */
@@ -81,25 +81,19 @@ public:
     */
    error_collector(const sstring_view& query) : _query(query) {}

-    virtual void syntax_error(Recognizer& recognizer, const std::vector<sstring>& token_names) override {
-        // FIXME: stub
-        syntax_error(recognizer, "Parsing failed, detailed description construction not implemented yet");
+    virtual void syntax_error(RecognizerType& recognizer, ANTLR_UINT8** token_names, ExceptionBaseType* ex) override { // records "<header> <message>" for ex
+        auto hdr = get_error_header(ex); // "line <line>:<char position in line>"
+        auto msg = get_error_message(recognizer, ex, token_names); // wording depends on ex->getType()
+        std::stringstream result;
+        result << hdr << ' ' << msg; // the query snippet (disabled block below) is not appended yet
 #if 0
-        String hdr = recognizer.getErrorHeader(e);
-        String msg = recognizer.getErrorMessage(e, tokenNames);
-
-        StringBuilder builder = new StringBuilder().append(hdr)
-                .append(' ')
-                .append(msg);
-
        if (recognizer instanceof Parser)
            appendQuerySnippet((Parser) recognizer, builder);
-
-        errorMsgs.add(builder.toString());
 #endif
+        _error_msgs.emplace_back(result.str()); // appended to the collected error messages
    }

-    virtual void syntax_error(Recognizer& recognizer, const sstring& msg) override {
+    virtual void syntax_error(RecognizerType& recognizer, const sstring& msg) override { // records msg verbatim; recognizer is unused
        _error_msgs.emplace_back(msg);
    }

@@ -114,6 +108,60 @@ public:
        }
    }

+private:
+    std::string get_error_header(ExceptionBaseType* ex) {
+        std::ostringstream header; // yields "line <line>:<char position in line>"
+        header << "line " << ex->get_line() << ":" << ex->get_charPositionInLine();
+        return header.str();
+    }
+
+    // Builds the human-readable description of a recognition error.
+    // Unwanted-token, missing-token and no-viable-alternative errors get custom
+    // wording; every other exception type is delegated to the exception's own
+    // displayRecognitionError(). token_names may be null: the expected token is
+    // then omitted (unwanted) or shown as "(<get_expecting() value>)" (missing).
+    std::string get_error_message(RecognizerType& recognizer, ExceptionBaseType* ex, ANTLR_UINT8** token_names)
+    {
+        using namespace antlr3;
+        // Display name of the expected token; must only be called when token_names is non-null.
+        auto expected_token_name = [&] () -> std::string {
+            if (recognizer.is_eof_token(ex->get_expecting())) {
+                return "EOF";
+            }
+            return reinterpret_cast<const char*>(token_names[ex->get_expecting()]);
+        };
+        std::stringstream msg;
+        switch (ex->getType()) {
+        case ExceptionType::UNWANTED_TOKEN_EXCEPTION:
+            msg << "extraneous input " << get_token_error_display(recognizer, ex->get_token());
+            if (token_names != nullptr) {
+                msg << " expecting " << expected_token_name();
+            }
+            break;
+        case ExceptionType::MISSING_TOKEN_EXCEPTION:
+            msg << "missing ";
+            if (token_names == nullptr) {
+                msg << "(" + std::to_string(ex->get_expecting()) + ")";
+            } else {
+                msg << expected_token_name();
+            }
+            msg << " at " << get_token_error_display(recognizer, ex->get_token());
+            break;
+        case ExceptionType::NO_VIABLE_ALT_EXCEPTION:
+            msg << "no viable alternative at input " << get_token_error_display(recognizer, ex->get_token());
+            break;
+        default:
+            // Any other exception type is handed to displayRecognitionError(token_names, msg).
+            ex->displayRecognitionError(token_names, msg);
+        }
+        return msg.str();
+    }
+
+    std::string get_token_error_display(RecognizerType& recognizer, const TokenType* token)
+    { // Returns recognizer.token_text(token) wrapped in single quotes, as embedded in the error messages.
+        return "'" + recognizer.token_text(token) + "'";
+    }
+
 #if 0

    /**
--- a/Show More
+++ b/Show More