Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feat: find best_detections for classifications (#631) #632

Merged
merged 3 commits into from
Jun 19, 2024
Merged
Show file tree
Hide file tree
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
77 changes: 39 additions & 38 deletions core/_cli/migrations/20240404131807-create-best-detections.ts.js
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Would this migration get run again?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Only in environments where it has not already run (probably none).

Original file line number Diff line number Diff line change
Expand Up @@ -56,46 +56,47 @@ module.exports = {
)
`, { transaction: t })

const jobs = await queryInterface.sequelize.query('select "id", "query_start", "query_end" from public.classifier_jobs', {
transaction: t,
type: Sequelize.QueryTypes.SELECT,
raw: true
})
// NOT USED SINCE IT'S rewritten in the next migration
// const jobs = await queryInterface.sequelize.query('select "id", "query_start", "query_end" from public.classifier_jobs', {
// transaction: t,
// type: Sequelize.QueryTypes.SELECT,
// raw: true
// })

for (const job of jobs) {
const replacements = {
classifierJobId: job.id,
perDayLimit: 10,
perStreamLimit: 10,
jobStart: job.query_start,
jobEnd: job.query_end
}
// for (const job of jobs) {
// const replacements = {
// classifierJobId: job.id,
// perDayLimit: 10,
// perStreamLimit: 10,
// jobStart: job.query_start,
// jobEnd: job.query_end
// }

await queryInterface.sequelize.query(`
INSERT INTO public.best_detections
SELECT
"detection_id", "start", "stream_id", "classifier_job_id", "confidence", "daily_ranking", "stream_ranking"
FROM (
SELECT
"id" as "detection_id", "start", "stream_id", "classifier_job_id", "confidence",
ROW_NUMBER() OVER(
PARTITION BY stream_id, date(timezone('UTC', "start"))
ORDER BY confidence DESC
) as daily_ranking,
ROW_NUMBER() OVER(
PARTITION BY stream_id
ORDER BY confidence DESC
) as stream_ranking
FROM public.detections
WHERE (start BETWEEN :jobStart AND :jobEnd) AND classifier_job_id = :classifierJobId
) as detection
WHERE daily_ranking < :perDayLimit OR stream_ranking < :perStreamLimit;
`, {
replacements,
type: Sequelize.QueryTypes.RAW,
transaction: t
})
}
// await queryInterface.sequelize.query(`
// INSERT INTO public.best_detections
// SELECT
// "detection_id", "start", "stream_id", "classifier_job_id", "confidence", "daily_ranking", "stream_ranking"
// FROM (
// SELECT
// "id" as "detection_id", "start", "stream_id", "classifier_job_id", "confidence",
// ROW_NUMBER() OVER(
// PARTITION BY stream_id, date(timezone('UTC', "start"))
// ORDER BY confidence DESC
// ) as daily_ranking,
// ROW_NUMBER() OVER(
// PARTITION BY stream_id
// ORDER BY confidence DESC
// ) as stream_ranking
// FROM public.detections
// WHERE (start BETWEEN :jobStart AND :jobEnd) AND classifier_job_id = :classifierJobId
// ) as detection
// WHERE daily_ranking < :perDayLimit OR stream_ranking < :perStreamLimit;
// `, {
// replacements,
// type: Sequelize.QueryTypes.RAW,
// transaction: t
// })
// }
veckatimest marked this conversation as resolved.
Show resolved Hide resolved
})
},
down: async (queryInterface) => {
Expand Down
143 changes: 143 additions & 0 deletions core/_cli/migrations/20240613065719-best-detections-for-species.js
Original file line number Diff line number Diff line change
@@ -0,0 +1,143 @@
'use strict'

module.exports = {
up: async (queryInterface, Sequelize) => {
return queryInterface.sequelize.transaction(async t => {
await queryInterface.sequelize.query('DELETE FROM public."best_detections"', {
transaction: t
})

await queryInterface.addColumn(
'best_detections',
'classification_id',
{
type: Sequelize.INTEGER,
allowNull: false,
references: {
model: {
tableName: 'classifications'
},
key: 'id'
}
},
{ transaction: t }
)
await queryInterface.renameColumn(
'best_detections',
'daily_ranking',
'stream_daily_ranking',
{ transaction: t }
)
await queryInterface.addColumn(
'best_detections',
'stream_classification_ranking',
{
type: Sequelize.INTEGER,
allowNull: false
},
{ transaction: t }
)
await queryInterface.addColumn(
'best_detections',
'stream_classification_daily_ranking',
{
type: Sequelize.INTEGER,
allowNull: false
},
{ transaction: t }
)

const jobs = await queryInterface.sequelize.query('select "id", "query_start", "query_end" from public.classifier_jobs', {
transaction: t,
type: Sequelize.QueryTypes.SELECT,
raw: true
})

for (const job of jobs) {
const replacements = {
classifierJobId: job.id,
dayLimit: 10,
limit: 10,
streamClassificationDayLimit: 5,
jobStart: job.query_start,
jobEnd: job.query_end
}

await queryInterface.sequelize.query(`
INSERT INTO public.best_detections
(
"detection_id",
"start", "stream_id", "classifier_job_id", "confidence", "classification_id",
"stream_ranking",
"stream_daily_ranking",
"stream_classification_ranking",
"stream_classification_daily_ranking"
)
SELECT
"detection_id",
"start", "stream_id", "classifier_job_id", "confidence", "classification_id"
"stream_ranking",
"stream_daily_ranking",
"stream_classification_ranking",
"stream_classification_daily_ranking",
FROM (
SELECT
"id" as "detection_id",
"start", "stream_id", "classifier_job_id", "confidence", "classification_id",
ROW_NUMBER() OVER(
PARTITION BY stream_id
ORDER BY confidence DESC
) as stream_ranking,
ROW_NUMBER() OVER(
PARTITION BY stream_id, date(timezone('UTC', "start"))
ORDER BY confidence DESC
) as stream_daily_ranking,
ROW_NUMBER() OVER(
PARTITION BY stream_id, classification_id
ORDER BY confidence DESC
) as stream_classification_ranking,
ROW_NUMBER() OVER(
PARTITION BY stream_id, classification_id, date(timezone('UTC', "start"))
ORDER BY confidence DESC
) as stream_classification_daily_ranking
FROM public.detections
WHERE (start BETWEEN :jobStart AND :jobEnd) AND classifier_job_id = :classifierJobId
) as detection
WHERE stream_ranking < :limit OR stream_classification_ranking < :limit OR
stream_daily_ranking < :dayLimit OR
stream_classification_daily_ranking < :streamClassificationDayLimit;`,
{
replacements,
type: Sequelize.QueryTypes.RAW,
transaction: t
})
}
})
},

down: async (queryInterface, Sequelize) => {
return queryInterface.sequelize.transaction(async t => {
await queryInterface.removeColumn(
'best_detections',
'classification_id',
{ transaction: t }
)
await queryInterface.renameColumn(
'best_detections',
'stream_daily_ranking',
'daily_ranking',
{ transaction: t }
)
await queryInterface.removeColumn(
'best_detections',
'stream_classification_ranking',
{ transaction: t }
)
await queryInterface.removeColumn(
'best_detections',
'stream_classification_daily_ranking',
{ transaction: t }
)
})
}
}
17 changes: 15 additions & 2 deletions core/_models/detections/best-detection.js
Original file line number Diff line number Diff line change
Expand Up @@ -21,13 +21,25 @@ module.exports = (sequelize, DataTypes) => {
type: DataTypes.FLOAT,
allowNull: false
},
dailyRanking: {
classificationId: {
type: DataTypes.INTEGER,
allowNull: false
allowNull: true
},
streamRanking: {
type: DataTypes.INTEGER,
allowNull: false
},
streamDailyRanking: {
type: DataTypes.INTEGER,
allowNull: false
},
streamClassificationRanking: {
type: DataTypes.INTEGER,
allowNull: false
},
streamClassificationDailyRanking: {
type: DataTypes.INTEGER,
allowNull: false
}
}, {
underscored: true,
Expand All @@ -36,6 +48,7 @@ module.exports = (sequelize, DataTypes) => {
BestDetection.associate = function (models) {
BestDetection.belongsTo(models.Detection, { as: 'detection', foreignKey: 'detection_id' })
BestDetection.belongsTo(models.ClassifierJob, { as: 'classifier_job', foreignKey: 'classifier_job_id' })
BestDetection.belongsTo(models.Classification, { as: 'classification', foreignKey: 'classification_id' })
}
return BestDetection
}
2 changes: 1 addition & 1 deletion core/_models/detections/detection.js
Original file line number Diff line number Diff line change
Expand Up @@ -41,7 +41,7 @@ module.exports = (sequelize, DataTypes) => {
Detection.hasOne(models.BestDetection, { as: 'bestDetection', foreignKey: 'detection_id' })
}
Detection.attributes = {
lite: ['stream_id', 'start', 'end', 'confidence'],
lite: ['id', 'stream_id', 'start', 'end', 'confidence'],
full: ['id', 'stream_id', 'classifier_id', 'classification_id', 'classifier_job_id', 'start', 'end', 'confidence', 'review_status']
}
return Detection
Expand Down
54 changes: 28 additions & 26 deletions core/detections/best-detections-summary.int.test.js
Original file line number Diff line number Diff line change
Expand Up @@ -93,11 +93,6 @@ let classifierJobs = [
}
]

afterAll(async () => {
await models.BestDetection.destroy({ where: {} })
await models.Detection.destroy({ where: {} })
})

function oneDetection (partialDetection) {
return {
streamId: streams[0].id,
Expand All @@ -123,21 +118,24 @@ let job2Stream1Day2BestDetection
async function makeManyDetections () {
const arbitraryDetections = []
streams.forEach((stream) => {
// we want 6 days of detections, 20 detections each day
for (let day = 1; day < 7; day++) {
let date = new Date('2024-01-01T08:00:00.000Z').setUTCDate(day).valueOf()

for (let i = 0; i < 20; i++) {
arbitraryDetections.push(oneDetection({
streamId: stream.id,
start: new Date(date),
end: new Date(date + 5000),
confidence: 0.7 + Math.random() / 10
}))

date += 60 * 60 * 1000
classifications.forEach((classification) => {
// we want 6 days of detections, 20 detections each day
veckatimest marked this conversation as resolved.
Show resolved Hide resolved
for (let day = 1; day < 7; day++) {
let date = new Date('2024-01-01T08:00:00.000Z').setUTCDate(day).valueOf()

for (let i = 0; i < 10; i++) {
arbitraryDetections.push(oneDetection({
streamId: stream.id,
classificationId: classification.id,
start: new Date(date),
end: new Date(date + 5000),
confidence: 0.7 + Math.random() / 10
}))

date += 60 * 60 * 1000
}
}
}
})
})

stream1Day1BestDetection = oneDetection({
Expand Down Expand Up @@ -211,11 +209,15 @@ async function makeManyDetections () {

beforeAll(async () => {
muteConsole('warn')
await truncateNonBase()
await truncateNonBase(models)

await models.ClassifierJob.destroy({ where: {}, force: true })
await models.Classifier.destroy({ where: {}, force: true })

await models.Project.create(project)
await models.Stream.bulkCreate(streams)
await models.Classification.bulkCreate(classifications)

await models.Classifier.bulkCreate(classifiers)
classifierJobs = await models.ClassifierJob.bulkCreate(classifierJobs)

Expand All @@ -229,7 +231,7 @@ beforeAll(async () => {
describe('GET /classifier-jobs/:id/best-detections/summary', () => {
test('should return right best per stream detections', async () => {
const query = {
n_per_stream: 2
n_per_chunk: 2
}

const response = await request(app).get(`/${classifierJobs[0].id}/best-detections/summary`).query(query)
Expand All @@ -245,7 +247,7 @@ describe('GET /classifier-jobs/:id/best-detections/summary', () => {
test('should return right best per day detections', async () => {
const query = {
by_date: true,
n_per_stream: 2,
n_per_chunk: 2,
start: '2024-01-01T00:00:00.000Z',
end: '2024-01-04T00:00:00.000Z'
}
Expand All @@ -263,7 +265,7 @@ describe('GET /classifier-jobs/:id/best-detections/summary', () => {
test('should respect stream_ids in best per day', async () => {
const query = {
by_date: true,
n_per_stream: 1,
n_per_chunk: 1,
start: '2024-01-01T00:00:00.000Z',
end: '2024-01-04T00:00:00.000Z',
streams: [streams[0].id, streams[1].id]
Expand All @@ -281,7 +283,7 @@ describe('GET /classifier-jobs/:id/best-detections/summary', () => {
test('should respect stream_ids in best per stream', async () => {
const query = {
by_date: false,
n_per_stream: 2,
n_per_chunk: 2,
streams: [streams[0].id, streams[1].id]
}

Expand All @@ -297,7 +299,7 @@ describe('GET /classifier-jobs/:id/best-detections/summary', () => {
test('should respect review statuses', async () => {
const query = {
by_date: false,
n_per_stream: 10, // max
n_per_chunk: 10, // max
review_statuses: ['uncertain', 'confirmed']
}

Expand All @@ -316,7 +318,7 @@ describe('GET /classifier-jobs/:id/best-detections/summary', () => {
test('should only find detections in requested job', async () => {
const query = {
by_date: false,
n_per_stream: 10 // max
n_per_chunk: 10 // max
}

const response = await request(app).get(`/${classifierJobs[1].id}/best-detections/summary`).query(query)
Expand Down
Loading
Loading