Cryptonomic · vishakh · Sep 14, 2021 · Aug 9, 2021 · Aug 12, 2021 · vishakh
diff --git a/...ala/tech/cryptonomic/conseil/api/routes/platform/data/tezos/TezosDataOperationsTest.scala b/...ala/tech/cryptonomic/conseil/api/routes/platform/data/tezos/TezosDataOperationsTest.scala
@@ -6,18 +6,11 @@ import com.softwaremill.diffx.scalatest.DiffMatcher
 import org.scalatest.concurrent.IntegrationPatience
 import slick.jdbc.PostgresProfile.api._
 import tech.cryptonomic.conseil.api.TezosInMemoryDatabaseSetup
-import tech.cryptonomic.conseil.common.generic.chain.DataTypes.{Query, _}
+import tech.cryptonomic.conseil.common.generic.chain.DataTypes.{Query, SimpleField, _}
 import tech.cryptonomic.conseil.common.testkit.{ConseilSpec, InMemoryDatabase}
-import tech.cryptonomic.conseil.common.tezos.Tables.{
-  AccountsHistoryRow,
-  AccountsRow,
-  BlocksRow,
-  FeesRow,
-  OperationGroupsRow,
-  OperationsRow
-}
+import tech.cryptonomic.conseil.common.tezos.Tables.{AccountsHistoryRow, AccountsRow, BlocksRow, FeesRow, OperationGroupsRow, OperationsRow}
 import tech.cryptonomic.conseil.common.tezos.{Fork, Tables}
-import tech.cryptonomic.conseil.common.tezos.TezosTypes.{makeAccountId, TezosBlockHash}
+import tech.cryptonomic.conseil.common.tezos.TezosTypes.{TezosBlockHash, makeAccountId}
 
 import scala.concurrent.duration._
 
@@ -2111,7 +2104,7 @@ class TezosDataOperationsTest
           Aggregation(
             field = "medium",
             function = AggregationType.count,
-            Some(
+            predicate = Some(
               AggregationPredicate(
                 operation = OperationType.gt,
                 set = List(1),
@@ -2169,7 +2162,7 @@ class TezosDataOperationsTest
           Aggregation(
             field = "medium",
             function = AggregationType.count,
-            Some(
+            predicate = Some(
               AggregationPredicate(
                 operation = OperationType.gt,
                 set = List(0),
@@ -2180,7 +2173,7 @@ class TezosDataOperationsTest
           Aggregation(
             field = "low",
             function = AggregationType.sum,
-            Some(
+            predicate = Some(
               AggregationPredicate(
                 operation = OperationType.eq,
                 set = List(0),
@@ -2271,6 +2264,46 @@ class TezosDataOperationsTest
 
       }
 
+    "aggregate with distinct count aggregation" in {
+      val feesTmp = List(
+        FeesRow(1, 1, 1, Timestamp.valueOf("2000-01-01 00:00:00"), "kind", forkId = Fork.mainForkId),
+        FeesRow(2, 1, 1, Timestamp.valueOf("2000-01-02 00:00:00"), "kind", forkId = Fork.mainForkId),
+        FeesRow(3, 2, 1, Timestamp.valueOf("2000-01-02 00:00:00"), "kind", forkId = Fork.mainForkId),
+        FeesRow(4, 2, 1, Timestamp.valueOf("2000-01-02 00:00:00"), "kind", forkId = Fork.mainForkId),
+        FeesRow(5, 3, 2, Timestamp.valueOf("2000-01-03 00:00:00"), "kind", forkId = Fork.mainForkId),
+        FeesRow(6, 3, 2, Timestamp.valueOf("2000-01-03 00:00:00"), "kind", forkId = Fork.mainForkId)
+      )
+
+      val aggregate = List(
+        Aggregation("low", AggregationType.count),
+        Aggregation("medium", AggregationType.countDistinct)
+      )
+
+      val populateAndTest = for {
+        _ <- Tables.Fees ++= feesTmp
+        found <- sut.selectWithPredicates(
+          "tezos",
+          table = Tables.Fees.baseTableRow.tableName,
+          columns = List(SimpleField("low"), SimpleField("medium"), SimpleField("high")),
+          predicates = List.empty,
+          ordering = List(QueryOrdering("count_distinct_medium", OrderDirection.desc)),
+          aggregation = aggregate,
+          temporalPartition = None,
+          snapshot = None,
+          outputType = OutputType.json,
+          limit = 10
+        )
+      } yield found
+
+      val result = dbHandler.run(populateAndTest.transactionally).futureValue
+
+      result shouldBe List(
+        Map("count_low" -> Some(4), "count_distinct_medium" -> Some(2), "high" -> Some(1)),
+        Map("count_low" -> Some(2), "count_distinct_medium" -> Some(1), "high" -> Some(2))
+      )
+    }
+
+
       "map date with datePart aggregation when it is only type of aggregation" in {
         val feesTmp = List(
           FeesRow(0, 1, 4, Timestamp.valueOf("2000-01-01 00:00:00"), "kind", forkId = Fork.mainForkId),

diff --git a/conseil-common/src/main/scala/tech/cryptonomic/conseil/common/generic/chain/DataTypes.scala b/conseil-common/src/main/scala/tech/cryptonomic/conseil/common/generic/chain/DataTypes.scala
@@ -24,7 +24,7 @@ object DataTypes {
   /** Method checks if type can be aggregated */
   lazy val canBeAggregated: DataType => AggregationType => Boolean = { dataType =>
     {
-      case AggregationType.count => true
+      case AggregationType.count | AggregationType.countDistinct => true
       case AggregationType.max | AggregationType.min =>
         Set(DataType.Decimal, DataType.Int, DataType.LargeInt, DataType.DateTime, DataType.Currency)(dataType)
       case AggregationType.avg | AggregationType.sum =>
@@ -249,7 +249,7 @@ object DataTypes {
     /** Helper method for extracting prefixes needed for SQL */
     def prefixes: List[String] = values.toList.map(_.toString + "_")
     type AggregationType = Value
-    val sum, count, max, min, avg = Value
+    val sum, count, max, min, avg, countDistinct = Value
   }
 
   /** Enumeration of aggregation functions */

diff --git a/conseil-common/src/main/scala/tech/cryptonomic/conseil/common/util/DatabaseUtil.scala b/conseil-common/src/main/scala/tech/cryptonomic/conseil/common/util/DatabaseUtil.scala
@@ -326,6 +326,7 @@ object DatabaseUtil {
       aggregationType match {
         case AggregationType.sum => s"SUM($column)"
         case AggregationType.count => s"COUNT($column)"
+        case AggregationType.countDistinct => s"COUNT(DISTINCT $column)"
         case AggregationType.max => s"MAX($column)"
         case AggregationType.min => s"MIN($column)"
         case AggregationType.avg => s"AVG($column)"
@@ -336,6 +337,7 @@ object DatabaseUtil {
       aggregationType match {
         case AggregationType.sum => s"sum_$column"
         case AggregationType.count => s"count_$column"
+        case AggregationType.countDistinct => s"count_distinct_$column"
         case AggregationType.max => s"max_$column"
         case AggregationType.min => s"min_$column"
         case AggregationType.avg => s"avg_$column"

diff --git a/...rre/src/main/scala/tech/cryptonomic/conseil/indexer/tezos/bigmaps/BigMapsOperations.scala b/...rre/src/main/scala/tech/cryptonomic/conseil/indexer/tezos/bigmaps/BigMapsOperations.scala
@@ -27,6 +27,7 @@ import tech.cryptonomic.conseil.common.tezos.TezosTypes.BlockTagged.fromBlockDat
   */
 case class BigMapsOperations[Profile <: ExPostgresProfile](profile: Profile) extends ConseilLogSupport {
   import profile.api._
+  import io.scalaland.chimney.dsl._
 
   /** Create an action to find and copy big maps based on the diff contained in the blocks
     *
@@ -95,7 +96,10 @@ case class BigMapsOperations[Profile <: ExPostgresProfile](profile: Profile) ext
           DBIO.sequence {
             List(
               Tables.BigMapContents.insertOrUpdateAll(rowsToWrite),
-              Tables.BigMapContentsHistory ++= updateData.map(Tables.BigMapContentsHistoryRow.tupled).distinct
+              Tables.BigMapContentsHistory ++= updateData
+                    .map(BigMapContentsRow.tupled)
+                    .map(_.transformInto[Tables.BigMapContentsHistoryRow])
+                    .distinct
             )
           }
         }