
New opt-in partitioning strategy that may help with read optimization… #2855

@@ -16,19 +16,21 @@

package geotrellis.spark.io.accumulo

import geotrellis.spark.LayerId
import geotrellis.spark.{Boundable, LayerId}
import geotrellis.spark.io._

import com.typesafe.scalalogging.LazyLogging
import geotrellis.spark.io.avro.AvroRecordCodec
import org.apache.accumulo.core.client.{BatchWriterConfig, Connector}
import org.apache.accumulo.core.security.Authorizations
import org.apache.accumulo.core.data.{Range => AccumuloRange}
import spray.json.JsonFormat

import scala.collection.JavaConverters._
import scala.reflect.ClassTag

class AccumuloLayerDeleter(val attributeStore: AttributeStore, connector: Connector) extends LazyLogging with LayerDeleter[LayerId] {

def delete(id: LayerId): Unit = {
def delete[K: ClassTag](id: LayerId): Unit = {
Author's review comment:

I was able to reduce the number of required bounds/evidence parameters to just the ClassTag itself... evidently that's all that is required to look up the KeyIndex.

I'm curious whether the metadata in the attributes table, which the delete implementation already loads, contains the required class name, so that we could materialize the class/type at runtime rather than rely on an API change.

Even if that information is available, though, I may need an assist using it: I'm not sure how I'd go from a reflective class-by-name lookup to the type constructor argument required for the KeyIndex lookup.
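
For context, a minimal sketch of the lookup this signature enables, assuming the existing `AttributeStore.readKeyIndex[K: ClassTag]` method is what satisfies the requirement; the object and method names below are illustrative only, not part of this changeset:

```scala
import scala.reflect.ClassTag

import geotrellis.spark.LayerId
import geotrellis.spark.io.AttributeStore
import geotrellis.spark.io.index.KeyIndex

object KeyIndexLookupSketch {
  // With nothing more than ClassTag evidence for K, the layer's KeyIndex can
  // be read back from the attribute store, which is why delete[K: ClassTag]
  // needs no further bounds/evidence parameters.
  def lookupKeyIndex[K: ClassTag](attributeStore: AttributeStore, id: LayerId): KeyIndex[K] =
    attributeStore.readKeyIndex[K](id)
}
```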

try {
val header = attributeStore.readHeader[AccumuloLayerHeader](id)
val numThreads = 1
@@ -32,8 +32,8 @@ import scala.reflect.ClassTag

class AccumuloLayerManager(attributeStore: AccumuloAttributeStore, instance: AccumuloInstance)(implicit sc: SparkContext)
extends LayerManager[LayerId]{
def delete(id: LayerId): Unit =
AccumuloLayerDeleter(attributeStore, instance).delete(id)
def delete[K: ClassTag](id: LayerId): Unit =
AccumuloLayerDeleter(attributeStore, instance).delete[K](id)

def copy[
K: AvroRecordCodec: Boundable: JsonFormat: ClassTag,
@@ -75,9 +75,9 @@ class AccumuloLayerReindexer(
val layerCopier = AccumuloLayerCopier(attributeStore, layerReader, layerWriter)

layerWriter.write(tmpId, layerReader.read[K, V, M](id), keyIndex)
layerDeleter.delete(id)
layerDeleter.delete[K](id)
layerCopier.copy[K, V, M](tmpId, id)
layerDeleter.delete(tmpId)
layerDeleter.delete[K](tmpId)
}

def reindex[
@@ -99,8 +99,8 @@ class AccumuloLayerReindexer(
val layerCopier = AccumuloLayerCopier(attributeStore, layerReader, layerWriter)

layerWriter.write(tmpId, layerReader.read[K, V, M](id), keyIndexMethod.createIndex(existingKeyIndex.keyBounds))
layerDeleter.delete(id)
layerDeleter.delete[K](id)
layerCopier.copy[K, V, M](tmpId, id)
layerDeleter.delete(tmpId)
layerDeleter.delete[K](tmpId)
}
}
cassandra/src/main/resources/reference.conf (24 changes: 16 additions & 8 deletions)
@@ -13,19 +13,27 @@
# limitations under the License.

geotrellis.cassandra {
port = 9042
catalog = "metadata"
keyspace = "geotrellis"
replicationStrategy = "SimpleStrategy"
replicationFactor = 1
localDc = "datacenter1"
usedHostsPerRemoteDc = 0
allowRemoteDCsForLocalConsistencyLevel = false
# 'writeoptimized' or 'readoptimized'; the default is 'writeoptimized'.
# With 'readoptimized', clients can configure the maximum size of a partition,
# measured in the number of tiles it holds. Careful tuning of this value can
# lead to optimized read performance when using key/partition caching.
indexStrategy = "writeoptimized"
# Only relevant if indexStrategy is 'readoptimized' - configures the
# maximum number of tiles to store per partition.
# tilesPerPartition = 64
threads {
collection.read = default
rdd {
write = default
read = default
}
}
}
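
As a sketch of how these settings might be consumed, the snippet below reads the two keys with Typesafe Config directly; the object name, the fallback default of 64, and the key name tilesPerPartition (taken from the Scala usage further down) are assumptions for illustration rather than part of this changeset:

```scala
import com.typesafe.config.ConfigFactory

object CassandraIndexSettingsSketch {
  def main(args: Array[String]): Unit = {
    // Loads reference.conf / application.conf from the classpath.
    val cfg = ConfigFactory.load().getConfig("geotrellis.cassandra")

    // 'writeoptimized' (the default) or 'readoptimized'.
    val indexStrategy = cfg.getString("indexStrategy")

    // Only meaningful when indexStrategy = "readoptimized"; fall back to 64
    // when the key is left commented out, as in the reference block above.
    val tilesPerPartition =
      if (cfg.hasPath("tilesPerPartition")) cfg.getInt("tilesPerPartition") else 64

    println(s"indexStrategy=$indexStrategy, tilesPerPartition=$tilesPerPartition")
  }
}
```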
@@ -45,7 +45,7 @@ class CassandraCollectionLayerReader(val attributeStore: AttributeStore, instanc

val decompose = (bounds: KeyBounds[K]) => keyIndex.indexRanges(bounds)

val seq = CassandraCollectionReader.read[K, V](instance, header.keyspace, header.tileTable, id, queryKeyBounds, decompose, filterIndexOnly, Some(writerSchema))
val seq = CassandraCollectionReader.read[K, V](instance, header.keyspace, header.tileTable, id, queryKeyBounds, decompose, filterIndexOnly, Some(writerSchema), keyIndex)
new ContextCollection(seq, layerMetadata)
}
}
@@ -21,16 +21,12 @@ import geotrellis.spark.io._
import geotrellis.spark.io.avro.codecs.KeyValueRecordCodec
import geotrellis.spark.io.avro.{AvroEncoder, AvroRecordCodec}
import geotrellis.spark.io.cassandra.conf.CassandraConfig
import geotrellis.spark.io.index.MergeQueue
import geotrellis.spark.io.index.{KeyIndex, MergeQueue}
import geotrellis.spark.util.KryoWrapper

import org.apache.avro.Schema
import com.datastax.driver.core.querybuilder.QueryBuilder
import com.datastax.driver.core.querybuilder.QueryBuilder.{eq => eqs}

import scala.collection.JavaConverters._
import scala.reflect.ClassTag

import java.math.BigInteger

object CassandraCollectionReader {
@@ -45,10 +45,13 @@
decomposeBounds: KeyBounds[K] => Seq[(BigInt, BigInt)],
filterIndexOnly: Boolean,
writerSchema: Option[Schema] = None,
keyIndex: KeyIndex[K],
threads: Int = defaultThreadCount
): Seq[(K, V)] = {
if (queryKeyBounds.isEmpty) return Seq.empty[(K, V)]

val indexStrategy = new CassandraIndexing[K](keyIndex, instance.cassandraConfig.tilesPerPartition)

val includeKey = (key: K) => queryKeyBounds.includeKey(key)
val _recordCodec = KeyValueRecordCodec[K, V]
val kwWriterSchema = KryoWrapper(writerSchema) //Avro Schema is not Serializable
@@ -58,18 +57,20 @@
else
queryKeyBounds.flatMap(decomposeBounds)

val query = QueryBuilder.select("value")
.from(keyspace, table)
.where(eqs("key", QueryBuilder.bindMarker()))
.and(eqs("name", layerId.name))
.and(eqs("zoom", layerId.zoom))
.toString
val query = indexStrategy.queryValueStatement(
instance.cassandraConfig.indexStrategy,
keyspace, table, layerId.name, layerId.zoom
)

instance.withSessionDo { session =>
val statement = session.prepare(query)
val statement = indexStrategy.prepareQuery(query)(session)
Author's review comment:

I made the evaluation of the session lazy, since you might want to get clever with a function that evaluates to a Session only when it's in the proper scope to be bound to a particular executor in Spark.

Maybe I'm overthinking this... but not evaluating my Cassandra sessions lazily is something that has bitten me before in other Spark code.
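
A minimal sketch of the curried shape being described here, assuming the Datastax 3.x Session and PreparedStatement types already used by this reader; the object and method names are illustrative, not the actual CassandraIndexing API:

```scala
import com.datastax.driver.core.{PreparedStatement, Session}

object LazyPrepareSketch {
  // Returning a Session => PreparedStatement defers all work against the
  // cluster until a Session is actually supplied, e.g. inside the executor
  // scope where that Session is valid.
  def prepareQuery(query: String): Session => PreparedStatement =
    (session: Session) => session.prepare(query)
}

// Usage sketch: nothing touches Cassandra until the returned function is applied.
// val prepared = LazyPrepareSketch.prepareQuery(query)(session)
```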


LayerReader.njoin[K, V](ranges.toIterator, threads){ index: BigInt =>
val row = session.execute(statement.bind(index: BigInteger))
val row = session.execute(indexStrategy.bindQuery(
instance.cassandraConfig.indexStrategy,
statement, index: BigInteger
))

if (row.asScala.nonEmpty) {
val bytes = row.one().getBytes("value").array()
val recs = AvroEncoder.fromBinary(kwWriterSchema.value.getOrElse(_recordCodec.schema), bytes)(_recordCodec)