Reward top winner a bigger cut, with a higher threshold for what defines a tier #69

Merged
merged 11 commits on Oct 22, 2024
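Alongside removing the image-hash deduplication path, this PR groups contestants into explicit score tiers: a submission starts a new tier only when it beats the current tier's reference score by more than TIER_SCORE_IMPROVEMENT_THRESHOLD (1.05 in the diff below). A minimal sketch of that grouping, mirroring the get_tiers() function added in validator/weight_setting/winner_selection.py — the UIDs and scores here are hypothetical, for illustration only:

```python
# Sketch of the tier grouping introduced in validator/weight_setting/winner_selection.py
# (see the get_tiers() diff below). UIDs and scores are hypothetical.
TIER_SCORE_IMPROVEMENT_THRESHOLD = 1.05

# (uid, score) pairs as produced by get_contestant_scores(), sorted by score.
contestants = [(5, 1.00), (9, 1.03), (7, 1.10), (3, 1.21)]

tiers = [[]]
last_tier_score = contestants[0][1]

for uid, score in contestants:
    if score > last_tier_score * TIER_SCORE_IMPROVEMENT_THRESHOLD:
        # Score improved by more than 5% over the tier's reference score: start a new tier.
        last_tier_score = score
        tiers.append([])

    tiers[-1].append(uid)

print(tiers)  # [[5, 9], [7], [3]]
```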
2 changes: 1 addition & 1 deletion miner/miner/submit.py
@@ -147,6 +147,7 @@ def start_benchmarking(submission: CheckpointSubmission):
baseline = generate_baseline(
inputs,
BASELINE_MODEL_DIRECTORY,
switch_user=False,
cache=True,
)
save_baseline_cache(baseline)
@@ -159,7 +160,6 @@ def start_benchmarking(submission: CheckpointSubmission):

compare_checkpoints(
ModelRepositoryInfo(url=submission.get_repo_link(), revision=submission.revision),
[],
inputs,
baseline,
MODEL_DIRECTORY,
1 change: 0 additions & 1 deletion neuron/neuron/submission_tester/__init__.py
@@ -3,4 +3,3 @@
from .testing import *
from .metrics import *
from .vram_monitor import *
from .hash import *
20 changes: 0 additions & 20 deletions neuron/neuron/submission_tester/hash.py

This file was deleted.

1 change: 0 additions & 1 deletion neuron/neuron/submission_tester/metrics.py
@@ -25,7 +25,6 @@ class CheckpointBenchmark(BaseModel):
model: MetricData
average_similarity: float
min_similarity: float
image_hash: bytes

def calculate_score(self, baseline_metrics: MetricData) -> float:
if self.min_similarity < SIMILARITY_SCORE_THRESHOLD:
39 changes: 1 addition & 38 deletions neuron/neuron/submission_tester/testing.py
@@ -1,26 +1,19 @@
import logging
from collections.abc import Iterable
from concurrent.futures import ThreadPoolExecutor, CancelledError
from io import BytesIO
from pathlib import Path
from statistics import mean
from threading import Event
from time import perf_counter

import imagehash
from PIL import Image

from pipelines import TextToImageRequest
from . import InvalidSubmissionError
from .hash import load_image_hash, save_image_hash, GENERATION_TIME_DIFFERENCE_THRESHOLD
from .inference_sandbox import InferenceSandbox
from .metrics import CheckpointBenchmark, MetricData, BaselineBenchmark
from .vram_monitor import VRamMonitor
from .. import (
GenerationOutput,
ModelRepositoryInfo,
CURRENT_CONTEST,
Key,
OutputComparator,
)

@@ -100,7 +93,6 @@ def generate_baseline(

def compare_checkpoints(
submission: ModelRepositoryInfo,
existing_benchmarks: Iterable[tuple[Key, CheckpointBenchmark | None]],
inputs: list[TextToImageRequest],
baseline: BaselineBenchmark,
sandbox_directory: Path = SANDBOX_DIRECTORY,
@@ -115,8 +107,6 @@ def compare_checkpoints(
with InferenceSandbox(submission, False, sandbox_directory, switch_user, cache) as sandbox:
size = sandbox.model_size

image_hash = None

try:
f"Take {len(inputs)} samples, keeping track of how fast/accurate generations have been"
for index, request in enumerate(inputs):
@@ -127,32 +117,6 @@

output = generate(sandbox, request)

if not image_hash:
with BytesIO(output.output) as data:
image_hash = imagehash.average_hash(Image.open(data))

image_hash_bytes = save_image_hash(image_hash)

match = next(
(
(key, existing_benchmark)
for key, existing_benchmark in existing_benchmarks
if (
existing_benchmark and
not (image_hash - load_image_hash(existing_benchmark.image_hash)) and
abs(output.generation_time - existing_benchmark.model.generation_time) < GENERATION_TIME_DIFFERENCE_THRESHOLD
)
),
None,
)

if match:
key, benchmark = match

logger.info(f"Submission {submission} marked as duplicate of hotkey {key}'s submission")

return benchmark

logger.info(
f"Sample {index + 1} Generated\n"
f"Generation Time: {output.generation_time}s\n"
@@ -171,7 +135,7 @@ def compare_checkpoints(
with CURRENT_CONTEST.output_comparator() as output_comparator:
def calculate_similarity(comparator: OutputComparator, baseline_output: GenerationOutput, optimized_output: GenerationOutput):
try:
if cancelled_event.is_set():
if cancelled_event and cancelled_event.is_set():
raise CancelledError()

return comparator(
@@ -205,7 +169,6 @@ def calculate_similarity(comparator: OutputComparator, baseline_output: Generati
),
average_similarity=average_similarity,
min_similarity=min_similarity,
image_hash=image_hash_bytes,
)

logger.info(
1 change: 0 additions & 1 deletion validator/submission_tester/benchmarker.py
@@ -62,7 +62,6 @@ def _benchmark_key(self, hotkey: Key):
try:
self.benchmarks[hotkey] = compare_checkpoints(
submission,
self.benchmarks.items(),
self.inputs,
self.baseline,
cancelled_event=self.cancelled_event,
47 changes: 0 additions & 47 deletions validator/weight_setting/deduplication.py

This file was deleted.

26 changes: 6 additions & 20 deletions validator/weight_setting/validator.py
@@ -42,16 +42,14 @@
BENCHMARKS_VERSION,
)
from neuron.submission_tester import (
load_image_hash,
CheckpointBenchmark,
MetricData,
)
from .benchmarking_api import BenchmarkingApi, benchmarking_api
from .deduplication import find_duplicates, PotentiallyDuplicateSubmissionInfo
from .wandb_args import add_wandb_args
from .winner_selection import get_scores, get_contestant_scores
from .winner_selection import get_scores, get_contestant_scores, get_tiers

VALIDATOR_VERSION: tuple[int, int, int] = (4, 2, 1)
VALIDATOR_VERSION: tuple[int, int, int] = (4, 3, 0)
VALIDATOR_VERSION_STRING = ".".join(map(str, VALIDATOR_VERSION))

WEIGHTS_VERSION = (
@@ -123,8 +121,6 @@ class Validator:
benchmarking_state: BenchmarkState
failed: set[int] = set() # for backwards depickling compatibility
invalid: dict[int, str]
hash_prompt: str
hash_seed: int
contest: Contest

def __init__(self):
@@ -550,7 +546,10 @@ def set_weights(self):

logger.info("Setting weights")

weights = get_scores(get_contestant_scores(self.benchmarks, self.baseline_metrics), len(self.metagraph.nodes))
contestants = get_contestant_scores(self.benchmarks, self.baseline_metrics)
tiers = get_tiers(contestants)
blocks = [info.block if info else None for info in self.contest_state.miner_info]
weights = get_scores(tiers, blocks, len(self.metagraph.nodes))

self.send_wandb_metrics()

@@ -848,19 +847,6 @@ async def do_step(self, block: int):
)
logger.info(self.benchmarks)

benchmark_duplicate_info = [
PotentiallyDuplicateSubmissionInfo(
image_hash=load_image_hash(benchmark.image_hash),
generation_time=benchmark.model.generation_time,
block=self.contest_state.miner_info[uid].block,
) if benchmark else None
for uid, benchmark in enumerate(self.benchmarks)
]

for duplicate_uid, original_uid in find_duplicates(benchmark_duplicate_info):
self.benchmarks[duplicate_uid] = None
self.invalid[duplicate_uid] = f"Duplicate of UID {original_uid}'s submission"

self.benchmarking = False
self.step += 1

47 changes: 41 additions & 6 deletions validator/weight_setting/winner_selection.py
@@ -1,8 +1,10 @@
from operator import itemgetter

from neuron import Uid
from neuron.submission_tester import CheckpointBenchmark, MetricData

TIER_SCORE_IMPROVEMENT_THRESHOLD = 1.05
WINNER_PERCENTAGE = 0.5


def get_contestant_scores(benchmarks: list[CheckpointBenchmark | None], baseline_metrics: MetricData):
@@ -17,23 +19,56 @@ def get_contestant_scores(benchmarks: list[CheckpointBenchmark | None], baseline
return sorted_contestants


def get_scores(contestants: list[tuple[int, float]], node_count: int) -> list[float]:
def get_tiers(contestants: list[tuple[Uid, float]]) -> list[list[Uid]]:
if not contestants:
return []

_, last_tier_score = contestants[0]

scores = [0.0] * node_count
tier = 1
tiers = [[]]

for contestant in contestants:
uid, score = contestant

if score > last_tier_score * TIER_SCORE_IMPROVEMENT_THRESHOLD:
# No longer in top threshold
# New tier
last_tier_score = score
tier += 1
tiers.append([])

tiers[-1].append(uid)

return tiers


def get_scores(tiers: list[list[Uid]], blocks: list[int | None], node_count: int) -> list[float]:
if not tiers:
return [1.0] * node_count

ordered_tiers = [
sorted(tier, key=blocks.__getitem__) for tier in tiers
]

modified_tiers = []

last_tier = None

for tier in ordered_tiers:
if last_tier:
modified_tiers.append([tier[0], *last_tier[1:]])
else:
modified_tiers.append([tier[0]])

last_tier = tier

modified_tiers.append(last_tier[1:])

scores = [0.0] * node_count

for index, tier in enumerate(modified_tiers):
incentive_pool = WINNER_PERCENTAGE * ((1 - WINNER_PERCENTAGE) ** index)
score = incentive_pool / len(tier)

scores[uid] = (score + 1) ** (tier * 0.75)
for uid in tier:
scores[uid] = score

return scores
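
For reference, a sketch of how the WINNER_PERCENTAGE split in the new get_scores() divides incentive across pools: each successive pool receives half of what remains (0.5, 0.25, 0.125, ...), and members of a pool share it evenly. The pool membership below is hypothetical, and it assumes index 0 is the pool that ends up holding the overall winner:

```python
# Illustration of the incentive_pool formula from the new get_scores() above.
# Pool membership is hypothetical; index 0 is assumed to be the winner's pool.
WINNER_PERCENTAGE = 0.5

pools = [[3], [7, 12], [5, 9, 11]]  # hypothetical UIDs grouped into payout pools

scores: dict[int, float] = {}

for index, pool in enumerate(pools):
    # 0.5, 0.25, 0.125, ... of the total incentive per pool
    incentive_pool = WINNER_PERCENTAGE * ((1 - WINNER_PERCENTAGE) ** index)

    for uid in pool:
        # members of a pool split it evenly
        scores[uid] = incentive_pool / len(pool)

print(scores)  # {3: 0.5, 7: 0.125, 12: 0.125, 5: ~0.042, 9: ~0.042, 11: ~0.042}
```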