Skip to content

Commit 04ebf99

Browse files
committed
feat(services): Add ScoringFeedbackService for relevance scoring feedback loop
- Implemented `ScoringFeedbackService` to learn from curator decisions and adjust relevance scoring weights.
- Added `computeLearnedWeights` and `analyzeFeedback` methods to derive and analyze weight adjustments based on accepted and rejected candidates.
- Updated `RelevanceScoringService` to support dynamic weight application and defaults fallback.
- Enhanced `PublicationDiscoveryService` to integrate feedback-based weight updates before candidate scoring.
- Extended repositories and added unit tests to validate feedback, weight adjustments, and integration behavior.
1 parent 16c4b08 commit 04ebf99

File tree

6 files changed

+528
-58
lines changed

6 files changed

+528
-58
lines changed

app/repositories/PublicationCandidateRepository.scala

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -21,6 +21,7 @@ trait PublicationCandidateRepository {
2121
def bulkReject(ids: Seq[Int], reason: String, reviewedBy: UUID): Future[Int]
2222
def saveCandidates(candidates: Seq[PublicationCandidate]): Future[Seq[PublicationCandidate]]
2323
def countByStatus(): Future[Map[String, Int]]
24+
def listReviewed(): Future[Seq[PublicationCandidate]]
2425
}
2526

2627
@Singleton
@@ -131,4 +132,8 @@ class PublicationCandidateRepositoryImpl @Inject()(
131132
(status, group.length)
132133
}.result).map(_.toMap)
133134
}
135+
136+
/**
 * Returns every candidate a curator has already decided on — i.e. rows whose
 * status is "accepted" or "rejected". Used by the scoring feedback loop to
 * learn weight adjustments from historical decisions.
 */
override def listReviewed(): Future[Seq[PublicationCandidate]] = {
  db.run(candidatesTable.filter(c => c.status === "accepted" || c.status === "rejected").result)
}
134139
}

app/services/PublicationDiscoveryService.scala

Lines changed: 58 additions & 51 deletions
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,8 @@ class PublicationDiscoveryService @Inject()(
1616
publicationRepository: PublicationRepository,
1717
publicationService: PublicationService,
1818
openAlexService: OpenAlexService,
19-
relevanceScoringService: RelevanceScoringService
19+
relevanceScoringService: RelevanceScoringService,
20+
scoringFeedbackService: ScoringFeedbackService
2021
)(implicit ec: ExecutionContext) extends Logging {
2122

2223
def acceptCandidate(candidateId: Int, reviewedBy: java.util.UUID): Future[Option[models.domain.publications.Publication]] = {
@@ -62,62 +63,68 @@ class PublicationDiscoveryService @Inject()(
6263
candidateRepository.bulkUpdateStatus(candidateIds, "deferred", reviewedBy, None)
6364
}
6465

66+
/**
 * Recomputes scoring weights from curator feedback and pushes the result into
 * the scoring service. When there is not enough feedback data, any previously
 * learned weights are cleared so scoring falls back to the configured defaults.
 *
 * @return the weights now in effect, or None when defaults are active
 */
def refreshLearnedWeights(): Future[Option[LearnedWeights]] = {
  scoringFeedbackService.computeLearnedWeights().map { maybeWeights =>
    maybeWeights.fold[Option[LearnedWeights]] {
      // No usable feedback — revert the scorer to its default weights.
      relevanceScoringService.clearLearnedWeights()
      None
    } { weights =>
      relevanceScoringService.applyLearnedWeights(weights)
      Some(weights)
    }
  }
}
76+
6577
/**
 * Runs one full discovery pass: refreshes feedback-learned scoring weights,
 * then for every enabled search configuration searches OpenAlex, deduplicates
 * results against already-ingested publications (by DOI), scores the new
 * candidates, persists them, and records an audit row for the run.
 *
 * A failure in one configuration is logged and does not abort the others.
 */
def runDiscovery(): Future[Unit] = {
  logger.info("Starting publication discovery run...")

  // Refresh learned weights from curator feedback before scoring new candidates.
  refreshLearnedWeights().flatMap { learnedWeights =>
    learnedWeights.foreach(w => logger.info(s"Using learned weights from ${w.sampleSize} reviewed candidates."))

    searchConfigRepository.getEnabledConfigs().flatMap { configs =>
      logger.info(s"Found ${configs.size} enabled search configurations.")

      // The DOI set is loop-invariant: fetch it once for the whole run instead
      // of issuing one repository query per configuration.
      val existingDoisFuture = publicationRepository.getAllDois.map(_.toSet)

      val runs = configs.map { config =>
        val startTime = System.currentTimeMillis()

        openAlexService.searchWorks(config.searchQuery).flatMap { rawCandidates =>
          existingDoisFuture.flatMap { existingDois =>
            // Deduplicate against existing publications by DOI.
            // NOTE(review): candidates without a DOI pass this filter; dedup for
            // those relies on the candidate repository's own checks — confirm.
            val newCandidates = rawCandidates.filterNot { c =>
              c.doi.exists(existingDois.contains)
            }

            // Multi-signal relevance scoring (uses learned weights when set).
            val scoredCandidates = relevanceScoringService.scoreCandidates(newCandidates)

            candidateRepository.saveCandidates(scoredCandidates).flatMap { savedCandidates =>
              val duration = (System.currentTimeMillis() - startTime).toInt

              // Audit record for this configuration's run.
              // config.id.get: enabled configs come from the database, so the id
              // is expected to be present; if it ever is not, this config's
              // future fails and is logged by the recover below.
              val run = PublicationSearchRun(
                id = None,
                configId = config.id.get,
                runAt = LocalDateTime.now(),
                candidatesFound = rawCandidates.size,
                newCandidates = savedCandidates.size,
                queryUsed = Some(config.searchQuery),
                durationMs = Some(duration)
              )

              for {
                _ <- runRepository.create(run)
                _ <- searchConfigRepository.updateLastRun(config.id.get, LocalDateTime.now())
              } yield ()
            }
          }
        }.recover {
          case e: Exception =>
            // One failing config must not abort the rest of the run.
            logger.error(s"Error running discovery for config '${config.name}' (ID: ${config.id}): ${e.getMessage}", e)
        }
      }

      Future.sequence(runs).map(_ => logger.info("Publication discovery run completed."))
    }
  }
}
123130
}

app/services/RelevanceScoringService.scala

Lines changed: 33 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,7 @@ import models.domain.publications.PublicationCandidate
55
import play.api.libs.json.{JsArray, JsValue}
66
import play.api.{Configuration, Logging}
77

8+
import java.util.concurrent.atomic.AtomicReference
89
import scala.concurrent.ExecutionContext
910

1011
/**
@@ -21,11 +22,38 @@ class RelevanceScoringService @Inject()(
2122
configuration: Configuration
2223
)(implicit ec: ExecutionContext) extends Logging {
2324

24-
// Weights for each scoring component (should sum to 1.0)
25-
private val keywordWeight: Double = configuration.getOptional[Double]("publication-discovery.scoring.keywordWeight").getOrElse(0.35)
26-
private val conceptWeight: Double = configuration.getOptional[Double]("publication-discovery.scoring.conceptWeight").getOrElse(0.25)
27-
private val citationWeight: Double = configuration.getOptional[Double]("publication-discovery.scoring.citationWeight").getOrElse(0.20)
28-
private val journalWeight: Double = configuration.getOptional[Double]("publication-discovery.scoring.journalWeight").getOrElse(0.20)
25+
// Default weights for each scoring component (should sum to 1.0).
// Read once from configuration at construction, with hard-coded fallbacks.
private val defaultKeywordWeight: Double = configuration.getOptional[Double]("publication-discovery.scoring.keywordWeight").getOrElse(0.35)
private val defaultConceptWeight: Double = configuration.getOptional[Double]("publication-discovery.scoring.conceptWeight").getOrElse(0.25)
private val defaultCitationWeight: Double = configuration.getOptional[Double]("publication-discovery.scoring.citationWeight").getOrElse(0.20)
private val defaultJournalWeight: Double = configuration.getOptional[Double]("publication-discovery.scoring.journalWeight").getOrElse(0.20)

// Learned weights from the feedback loop (override the defaults when set).
// Held in an AtomicReference because apply/clear may run on a different
// thread than the scoring path.
private val learnedWeightsRef: AtomicReference[Option[LearnedWeights]] = new AtomicReference(None)
33+
34+
/**
 * Installs feedback-derived weights; they take effect for all subsequent
 * scoring until [[clearLearnedWeights]] is called.
 */
def applyLearnedWeights(weights: LearnedWeights): Unit = {
  learnedWeightsRef.set(Some(weights))
  val detail = f"keyword=${weights.keywordWeight}%.3f, concept=${weights.conceptWeight}%.3f, " +
    f"citation=${weights.citationWeight}%.3f, journal=${weights.journalWeight}%.3f"
  logger.info(s"Applied learned weights from ${weights.sampleSize} samples: $detail")
}
40+
41+
/** Discards any learned weights so scoring reverts to the configured defaults. */
def clearLearnedWeights(): Unit = {
  learnedWeightsRef.set(None)
  logger.info("Cleared learned weights, reverting to defaults.")
}
45+
46+
/**
 * The weights currently in effect, as (keyword, concept, citation, journal):
 * learned weights when the feedback loop has set them, configured defaults
 * otherwise.
 */
def getActiveWeights: (Double, Double, Double, Double) =
  learnedWeightsRef.get()
    .map(lw => (lw.keywordWeight, lw.conceptWeight, lw.citationWeight, lw.journalWeight))
    .getOrElse((defaultKeywordWeight, defaultConceptWeight, defaultCitationWeight, defaultJournalWeight))
52+
53+
// Per-component weight accessors used by the scoring code.
// NOTE(review): each accessor re-reads the atomic reference independently, so
// a scoring pass that reads several weights can observe a mix of old and new
// values if applyLearnedWeights runs concurrently. If scoring can overlap a
// refresh, consider snapshotting getActiveWeights once per candidate — confirm.
private def keywordWeight: Double = getActiveWeights._1
private def conceptWeight: Double = getActiveWeights._2
private def citationWeight: Double = getActiveWeights._3
private def journalWeight: Double = getActiveWeights._4
2957

3058
// High-value keywords for genomics/phylogenetics domain
3159
private[services] val primaryKeywords: Set[String] = Set(
Lines changed: 170 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,170 @@
1+
package services
2+
3+
import jakarta.inject.{Inject, Singleton}
4+
import models.domain.publications.PublicationCandidate
5+
import play.api.Logging
6+
import repositories.PublicationCandidateRepository
7+
8+
import scala.concurrent.{ExecutionContext, Future}
9+
10+
/**
 * Learns from curator accept/reject decisions to improve relevance scoring.
 *
 * Analyzes historical decisions by computing per-component score distributions
 * for accepted vs rejected candidates, then derives adjusted weights that
 * emphasize components with higher discriminative power.
 */
@Singleton
class ScoringFeedbackService @Inject()(
  candidateRepository: PublicationCandidateRepository,
  relevanceScoringService: RelevanceScoringService
)(implicit ec: ExecutionContext) extends Logging {

  // Minimum number of reviewed candidates before feedback learning kicks in.
  val MinSamplesForFeedback: Int = 10

  /**
   * Analyze all reviewed candidates and compute learned weight adjustments.
   * Returns None if there is insufficient data: fewer than
   * MinSamplesForFeedback reviewed candidates, or no candidates on one side
   * of the accept/reject split (both populations are needed to measure
   * discrimination).
   */
  def computeLearnedWeights(): Future[Option[LearnedWeights]] = {
    candidateRepository.listReviewed().map { reviewed =>
      if (reviewed.size < MinSamplesForFeedback) {
        logger.info(s"Insufficient reviewed candidates (${reviewed.size}/$MinSamplesForFeedback) for feedback learning.")
        None
      } else {
        val accepted = reviewed.filter(_.status == "accepted")
        val rejected = reviewed.filter(_.status == "rejected")

        if (accepted.isEmpty || rejected.isEmpty) {
          logger.info("Need both accepted and rejected candidates for feedback learning.")
          None
        } else {
          Some(deriveWeights(accepted, rejected))
        }
      }
    }
  }

  /**
   * Compute a feedback analysis report with per-component statistics.
   * Returns None when nothing has been reviewed yet.
   */
  def analyzeFeedback(): Future[Option[FeedbackAnalysis]] = {
    candidateRepository.listReviewed().map { reviewed =>
      val accepted = reviewed.filter(_.status == "accepted")
      val rejected = reviewed.filter(_.status == "rejected")

      if (accepted.isEmpty && rejected.isEmpty) None
      else {
        val acceptedBreakdowns = accepted.map(relevanceScoringService.scoreBreakdown)
        val rejectedBreakdowns = rejected.map(relevanceScoringService.scoreBreakdown)

        Some(FeedbackAnalysis(
          totalReviewed = reviewed.size,
          acceptedCount = accepted.size,
          rejectedCount = rejected.size,
          acceptedMeans = computeMeans(acceptedBreakdowns),
          rejectedMeans = computeMeans(rejectedBreakdowns),
          componentDiscriminativePower = computeDiscriminativePower(acceptedBreakdowns, rejectedBreakdowns)
        ))
      }
    }
  }

  /**
   * Derive blended, normalized weights from the two reviewed populations.
   * Precondition: both `accepted` and `rejected` are non-empty (enforced by
   * computeLearnedWeights).
   */
  private[services] def deriveWeights(
    accepted: Seq[PublicationCandidate],
    rejected: Seq[PublicationCandidate]
  ): LearnedWeights = {
    val acceptedBreakdowns = accepted.map(relevanceScoringService.scoreBreakdown)
    val rejectedBreakdowns = rejected.map(relevanceScoringService.scoreBreakdown)

    val discriminativePower = computeDiscriminativePower(acceptedBreakdowns, rejectedBreakdowns)

    // Compute new weights proportional to discriminative power,
    // blended with the current weights for stability (70% current, 30% learned).
    // Reuse an already-computed breakdown for the baseline weights instead of
    // re-scoring the same candidate once per component, as the previous version
    // did with four separate scoreBreakdown(accepted.head) calls.
    // NOTE(review): the breakdown reports the *active* weights, so once learned
    // weights are applied, later refreshes blend against the learned values
    // rather than the configured defaults — weights can drift toward pure
    // discriminative power over repeated cycles. Confirm this is intended.
    val blendRatio = 0.3
    val baseline = acceptedBreakdowns.head
    val originalWeights = Map(
      "keyword" -> baseline.keywordWeight,
      "concept" -> baseline.conceptWeight,
      "citation" -> baseline.citationWeight,
      "journal" -> baseline.journalWeight
    )

    // Normalize discriminative power to sum to 1.0 for use as weights;
    // if no component discriminates at all, fall back to the current weights.
    val totalPower = discriminativePower.values.sum
    val learnedRaw = if (totalPower > 0) {
      discriminativePower.view.mapValues(_ / totalPower).toMap
    } else {
      originalWeights
    }

    // Blend: new_weight = (1 - blend) * original + blend * learned
    val blended = originalWeights.map { case (component, origWeight) =>
      val learnedWeight = learnedRaw.getOrElse(component, origWeight)
      component -> ((1.0 - blendRatio) * origWeight + blendRatio * learnedWeight)
    }

    // Re-normalize so the blended weights sum to 1.0.
    val blendedTotal = blended.values.sum
    val normalized = blended.view.mapValues(_ / blendedTotal).toMap

    logger.info(s"Learned weights from ${accepted.size + rejected.size} reviewed candidates: $normalized")

    LearnedWeights(
      keywordWeight = normalized("keyword"),
      conceptWeight = normalized("concept"),
      citationWeight = normalized("citation"),
      journalWeight = normalized("journal"),
      sampleSize = accepted.size + rejected.size,
      discriminativePower = discriminativePower
    )
  }

  /**
   * Discriminative power = |mean_accepted - mean_rejected| for each component.
   * Higher values mean the component better separates accepted from rejected.
   */
  private[services] def computeDiscriminativePower(
    acceptedBreakdowns: Seq[ScoringBreakdown],
    rejectedBreakdowns: Seq[ScoringBreakdown]
  ): Map[String, Double] = {
    val acceptedMeans = computeMeans(acceptedBreakdowns)
    val rejectedMeans = computeMeans(rejectedBreakdowns)

    Map(
      "keyword" -> math.abs(acceptedMeans.getOrElse("keyword", 0.0) - rejectedMeans.getOrElse("keyword", 0.0)),
      "concept" -> math.abs(acceptedMeans.getOrElse("concept", 0.0) - rejectedMeans.getOrElse("concept", 0.0)),
      "citation" -> math.abs(acceptedMeans.getOrElse("citation", 0.0) - rejectedMeans.getOrElse("citation", 0.0)),
      "journal" -> math.abs(acceptedMeans.getOrElse("journal", 0.0) - rejectedMeans.getOrElse("journal", 0.0))
    )
  }

  /** Per-component mean scores; all zeros for an empty input. */
  private[services] def computeMeans(breakdowns: Seq[ScoringBreakdown]): Map[String, Double] = {
    if (breakdowns.isEmpty) return Map("keyword" -> 0.0, "concept" -> 0.0, "citation" -> 0.0, "journal" -> 0.0)

    val n = breakdowns.size.toDouble
    Map(
      "keyword" -> breakdowns.map(_.keywordScore).sum / n,
      "concept" -> breakdowns.map(_.conceptScore).sum / n,
      "citation" -> breakdowns.map(_.citationScore).sum / n,
      "journal" -> breakdowns.map(_.journalScore).sum / n
    )
  }
}
153+
154+
/**
 * Scoring weights derived from curator feedback, normalized to sum to 1.0.
 *
 * @param keywordWeight       blended weight for the keyword component
 * @param conceptWeight       blended weight for the concept component
 * @param citationWeight      blended weight for the citation component
 * @param journalWeight       blended weight for the journal component
 * @param sampleSize          number of reviewed candidates used for derivation
 * @param discriminativePower per-component |mean(accepted) - mean(rejected)| gap
 */
case class LearnedWeights(
  keywordWeight: Double,
  conceptWeight: Double,
  citationWeight: Double,
  journalWeight: Double,
  sampleSize: Int,
  discriminativePower: Map[String, Double]
)
162+
163+
/**
 * Summary statistics of curator feedback for reporting/inspection.
 *
 * @param totalReviewed                total candidates with a curator decision
 * @param acceptedCount                how many were accepted
 * @param rejectedCount                how many were rejected
 * @param acceptedMeans                per-component mean scores of accepted candidates
 * @param rejectedMeans                per-component mean scores of rejected candidates
 * @param componentDiscriminativePower per-component |mean(accepted) - mean(rejected)| gap
 */
case class FeedbackAnalysis(
  totalReviewed: Int,
  acceptedCount: Int,
  rejectedCount: Int,
  acceptedMeans: Map[String, Double],
  rejectedMeans: Map[String, Double],
  componentDiscriminativePower: Map[String, Double]
)

test/services/PublicationDiscoveryServiceSpec.scala

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -19,15 +19,18 @@ class PublicationDiscoveryServiceSpec extends ServiceSpec {
1919
val mockPubService: PublicationService = mock[PublicationService]
2020
val mockOpenAlexService: OpenAlexService = mock[OpenAlexService]
2121
val mockRelevanceScoringService: RelevanceScoringService = mock[RelevanceScoringService]
22+
val mockScoringFeedbackService: ScoringFeedbackService = mock[ScoringFeedbackService]
2223

2324
val service = new PublicationDiscoveryService(
2425
mockSearchConfigRepo, mockCandidateRepo, mockRunRepo,
25-
mockPubRepo, mockPubService, mockOpenAlexService, mockRelevanceScoringService
26+
mockPubRepo, mockPubService, mockOpenAlexService, mockRelevanceScoringService,
27+
mockScoringFeedbackService
2628
)
2729

2830
override def beforeEach(): Unit = {
2931
reset(mockSearchConfigRepo, mockCandidateRepo, mockRunRepo,
30-
mockPubRepo, mockPubService, mockOpenAlexService, mockRelevanceScoringService)
32+
mockPubRepo, mockPubService, mockOpenAlexService, mockRelevanceScoringService,
33+
mockScoringFeedbackService)
3134
}
3235

3336
val reviewerId: UUID = UUID.randomUUID()

0 commit comments

Comments
 (0)