feat!: Added support for Blockchain-based federated training using Et…

…hereum.
ertis-research · Sep 7, 2024 · 44252b1 · 44252b1
1 parent f4ceb28
commit 44252b1
Show file tree

Hide file tree

Showing 44 changed files with 3,010 additions and 917 deletions.
diff --git a/README.md b/README.md
@@ -734,8 +734,8 @@ steps:
 7. Install the libraries and execute the frontend:
    ```bash
    cd frontend
-   npm install
-   npm i -g @angular/cli
+   npm install # nvm install 10 & nvm use 10.24.1
+   npm i -g @angular/cli@9.1.15
    ng build -c production
    docker build --tag localhost:5000/frontend .
    docker push localhost:5000/frontend

diff --git a/backend/automl/models.py b/backend/automl/models.py
@@ -1,134 +1,138 @@
-from django.db import models
-from django.utils.timezone import now
-from django.conf import settings
-from model_utils import Choices
-from model_utils.fields import StatusField, MonitorField
-
-class MLModel(models.Model):
-    """Machine learning model to be trained in the system"""
-
-    name = models.CharField(unique=True, max_length=30)
-    description = models.CharField(max_length=100, blank=True)
-    imports = models.TextField(blank=True)
-    code = models.TextField()
-    distributed = models.BooleanField(default=False)
-    father = models.OneToOneField('self', null=True, blank=True, default=None, related_name='child', on_delete=models.SET_NULL)
-    framework = models.TextField()
-
-class Configuration(models.Model):
-    """Set of ML models to be used for training"""
-
-    name = models.CharField(unique=True, max_length=30)
-    description = models.CharField(max_length=100, blank=True)
-    ml_models = models.ManyToManyField(MLModel)
-    time = models.DateTimeField(default=now, editable=False)
-
-    class Meta(object):
-        ordering = ('-time', )
-
-class Deployment(models.Model):
-    """Deployment of a configuration of models for training"""
-
-    # General Deployment Settings
-    batch = models.IntegerField(default=1)
-    tf_kwargs_fit = models.CharField(max_length=100, blank=True)
-    tf_kwargs_val = models.CharField(max_length=100, blank=True)
-    pth_kwargs_fit = models.CharField(max_length=100, blank=True)
-    pth_kwargs_val = models.CharField(max_length=100, blank=True)
-    conf_mat_settings = models.BooleanField(default=False, blank=True, null=True)
-    configuration = models.ForeignKey(Configuration, related_name='deployments', on_delete=models.CASCADE)
-    time = models.DateTimeField(default=now, editable=False)
-
-    # Distributed Deployment Settings
-    optimizer = models.TextField(default='adam', blank=True)
-    learning_rate = models.DecimalField(max_digits=7, decimal_places=6, default=0.001, blank=True)
-    loss = models.TextField(default='sparse_categorical_crossentropy', blank=True)
-    metrics = models.TextField(default='sparse_categorical_accuracy', blank=True)
-
-    # Incremental Deployment Settings
-    incremental = models.BooleanField(default=False)
-    indefinite = models.BooleanField(default=False)
-    stream_timeout = models.IntegerField(default=60000, blank=True, null=True)
-    monitoring_metric = models.TextField(blank=True, null=True)
-    change = models.TextField(blank=True, null=True)
-    improvement = models.DecimalField(max_digits=7, decimal_places=6, blank=True, null=True, default=0.05)
-
-    # Unsupervised Deployment Settings
-    unsupervised = models.BooleanField(default=False)
-    unsupervised_rounds = models.IntegerField(default=5, blank=True, null=True)
-    confidence = models.DecimalField(max_digits=7, decimal_places=6, blank=True, null=True, default=0.9)
-
-    # Federated Deployment Settings
-    federated = models.BooleanField(default=False)
-    agg_rounds = models.IntegerField(default=15, blank=True, null=True)
-    min_data = models.IntegerField(default=1000, blank=True, null=True)
-    AGGREGATION_STRATEGIES = Choices('FedAvg', 'FedOpt', 'FedAdagrad', 'FedAdam', 'FedYogi')
-    agg_strategy = StatusField(choices_name='AGGREGATION_STRATEGIES')
-    data_restriction = models.JSONField(default=dict, blank=True, null=True)
-
-    class Meta(object):
-        ordering = ('-time', )
-
-class TrainingResult(models.Model):
-    """Training result information obtained once deployed a model"""
-
-    STATUS = Choices('created', 'deployed', 'stopped', 'finished')
-    """Sets its default value to the first item in the STATUS choices:"""
-    status = StatusField()
-    status_changed = MonitorField(monitor='status')
-    deployment = models.ForeignKey(Deployment, default=None, related_name='results', on_delete=models.CASCADE)
-    model = models.ForeignKey(MLModel, related_name='trained', on_delete=models.CASCADE)
-    train_metrics = models.JSONField(blank=True, null=True)
-    val_metrics = models.JSONField(blank=True, null=True)
-    test_metrics = models.JSONField(blank=True, null=True)
-    confusion_matrix = models.JSONField(blank=True, null=True, default=None)
-    training_time = models.DecimalField(max_digits=14, decimal_places=4, blank=True, null=True)
-    trained_model = models.FileField(upload_to=settings.TRAINED_MODELS_DIR, blank=True)
-    confusion_mat_img = models.FileField(upload_to=settings.TRAINED_MODELS_DIR, blank=True, null=True)
-
-    class Meta(object):
-        ordering = ('-status_changed', )
-
-class Datasource(models.Model):
-    """Datasource used for training a deployed model"""
-
-    INPUT_FORMAT = Choices('RAW', 'AVRO', 'JSON', 'TELEGRAF_STR_JSON')
-    """Sets its default value to the first item in the STATUS choices:"""
-    input_format = StatusField(choices_name='INPUT_FORMAT')
-    deployment = models.TextField() 
-    input_config = models.TextField(blank=True) 
-    description = models.TextField(blank=True)
-    topic = models.TextField()
-    total_msg = models.IntegerField(blank=True, null=True)
-    validation_rate = models.DecimalField(max_digits=7, decimal_places=6, blank=True, null=True)
-    test_rate = models.DecimalField(max_digits=7, decimal_places=6, blank=True, null=True)
-    time = models.DateTimeField()
-
-    class Meta(object):
-        ordering = ('-time', )
-
-class Inference(models.Model):
-    """Training result information obtained once deployed a model"""
-    INPUT_FORMAT = Choices('RAW', 'AVRO', 'JSON', 'TELEGRAF_STR_JSON')
-    STATUS = Choices('deployed', 'stopped')
-    """Sets its default value to the first item in the STATUS choices:"""
-
-    status = StatusField()
-    status_changed = MonitorField(monitor='status')
-    model_result = models.ForeignKey(TrainingResult, null=True, related_name='inferences', on_delete=models.SET_NULL)
-    replicas = models.IntegerField(default=1)
-    input_format = StatusField(choices_name='INPUT_FORMAT')
-    input_config = models.TextField(blank=True)
-    input_topic = models.TextField(blank=True)
-    output_topic = models.TextField(blank=True)
-    time = models.DateTimeField(default=now, editable=False)
-    limit = models.DecimalField(max_digits=15, decimal_places=10, blank=True,  null=True)
-    output_upper = models.TextField(blank=True)
-    token = models.TextField(blank=True, default=None, null=True)
-    external_host = models.TextField(blank=True, default=None, null=True)
-    input_kafka_broker = models.TextField(blank=True, default=None, null=True)
-    output_kafka_broker = models.TextField(blank=True, default=None, null=True)
-    upper_kafka_broker = models.TextField(blank=True, default=None, null=True)
-
-    class Meta(object):
-        ordering = ('-time', )
+from django.db import models
+from django.utils.timezone import now
+from django.conf import settings
+from model_utils import Choices
+from model_utils.fields import StatusField, MonitorField
+
+class MLModel(models.Model):
+    """Machine learning model to be trained in the system"""
+
+    name = models.CharField(unique=True, max_length=30)
+    description = models.CharField(max_length=100, blank=True)
+    imports = models.TextField(blank=True)
+    code = models.TextField()
+    distributed = models.BooleanField(default=False)
+    father = models.OneToOneField('self', null=True, blank=True, default=None, related_name='child', on_delete=models.SET_NULL)
+    framework = models.TextField()
+
+class Configuration(models.Model):
+    """Set of ML models to be used for training"""
+
+    name = models.CharField(unique=True, max_length=30)
+    description = models.CharField(max_length=100, blank=True)
+    ml_models = models.ManyToManyField(MLModel)
+    time = models.DateTimeField(default=now, editable=False)
+
+    class Meta(object):
+        ordering = ('-time', )
+
+class Deployment(models.Model):
+    """Deployment of a configuration of models for training"""
+
+    # General Deployment Settings
+    batch = models.IntegerField(default=1)
+    tf_kwargs_fit = models.CharField(max_length=100, blank=True)
+    tf_kwargs_val = models.CharField(max_length=100, blank=True)
+    pth_kwargs_fit = models.CharField(max_length=100, blank=True)
+    pth_kwargs_val = models.CharField(max_length=100, blank=True)
+    conf_mat_settings = models.BooleanField(default=False, blank=True, null=True)
+    configuration = models.ForeignKey(Configuration, related_name='deployments', on_delete=models.CASCADE)
+    time = models.DateTimeField(default=now, editable=False)
+
+    # Distributed Deployment Settings
+    optimizer = models.TextField(default='adam', blank=True)
+    learning_rate = models.DecimalField(max_digits=7, decimal_places=6, default=0.001, blank=True)
+    loss = models.TextField(default='sparse_categorical_crossentropy', blank=True)
+    metrics = models.TextField(default='sparse_categorical_accuracy', blank=True)
+
+    # Incremental Deployment Settings
+    incremental = models.BooleanField(default=False)
+    indefinite = models.BooleanField(default=False)
+    stream_timeout = models.IntegerField(default=60000, blank=True, null=True)
+    monitoring_metric = models.TextField(blank=True, null=True)
+    change = models.TextField(blank=True, null=True)
+    improvement = models.DecimalField(max_digits=7, decimal_places=6, blank=True, null=True, default=0.05)
+
+    # Unsupervised Deployment Settings
+    unsupervised = models.BooleanField(default=False)
+    unsupervised_rounds = models.IntegerField(default=5, blank=True, null=True)
+    confidence = models.DecimalField(max_digits=7, decimal_places=6, blank=True, null=True, default=0.9)
+
+    # Federated Deployment Settings
+    federated = models.BooleanField(default=False)
+    agg_rounds = models.IntegerField(default=15, blank=True, null=True)
+    min_data = models.IntegerField(default=1000, blank=True, null=True)
+    AGGREGATION_STRATEGIES = Choices('FedAvg', 'FedOpt', 'FedAdagrad', 'FedAdam', 'FedYogi')
+    agg_strategy = StatusField(choices_name='AGGREGATION_STRATEGIES')
+    data_restriction = models.JSONField(default=dict, blank=True, null=True)
+
+    # Federated Blockchain Deployment Settings
+    blockchain = models.BooleanField(default=False)
+
+
+    class Meta(object):
+        ordering = ('-time', )
+
+class TrainingResult(models.Model):
+    """Training result information obtained once deployed a model"""
+
+    STATUS = Choices('created', 'deployed', 'stopped', 'finished')
+    """Sets its default value to the first item in the STATUS choices:"""
+    status = StatusField()
+    status_changed = MonitorField(monitor='status')
+    deployment = models.ForeignKey(Deployment, default=None, related_name='results', on_delete=models.CASCADE)
+    model = models.ForeignKey(MLModel, related_name='trained', on_delete=models.CASCADE)
+    train_metrics = models.JSONField(blank=True, null=True)
+    val_metrics = models.JSONField(blank=True, null=True)
+    test_metrics = models.JSONField(blank=True, null=True)
+    confusion_matrix = models.JSONField(blank=True, null=True, default=None)
+    training_time = models.DecimalField(max_digits=14, decimal_places=4, blank=True, null=True)
+    trained_model = models.FileField(upload_to=settings.TRAINED_MODELS_DIR, blank=True)
+    confusion_mat_img = models.FileField(upload_to=settings.TRAINED_MODELS_DIR, blank=True, null=True)
+
+    class Meta(object):
+        ordering = ('-status_changed', )
+
+class Datasource(models.Model):
+    """Datasource used for training a deployed model"""
+
+    INPUT_FORMAT = Choices('RAW', 'AVRO', 'JSON', 'TELEGRAF_STR_JSON')
+    """Sets its default value to the first item in the STATUS choices:"""
+    input_format = StatusField(choices_name='INPUT_FORMAT')
+    deployment = models.TextField() 
+    input_config = models.TextField(blank=True) 
+    description = models.TextField(blank=True)
+    topic = models.TextField()
+    total_msg = models.IntegerField(blank=True, null=True)
+    validation_rate = models.DecimalField(max_digits=7, decimal_places=6, blank=True, null=True)
+    test_rate = models.DecimalField(max_digits=7, decimal_places=6, blank=True, null=True)
+    time = models.DateTimeField()
+
+    class Meta(object):
+        ordering = ('-time', )
+
+class Inference(models.Model):
+    """Training result information obtained once deployed a model"""
+    INPUT_FORMAT = Choices('RAW', 'AVRO', 'JSON', 'TELEGRAF_STR_JSON')
+    STATUS = Choices('deployed', 'stopped')
+    """Sets its default value to the first item in the STATUS choices:"""
+
+    status = StatusField()
+    status_changed = MonitorField(monitor='status')
+    model_result = models.ForeignKey(TrainingResult, null=True, related_name='inferences', on_delete=models.SET_NULL)
+    replicas = models.IntegerField(default=1)
+    input_format = StatusField(choices_name='INPUT_FORMAT')
+    input_config = models.TextField(blank=True)
+    input_topic = models.TextField(blank=True)
+    output_topic = models.TextField(blank=True)
+    time = models.DateTimeField(default=now, editable=False)
+    limit = models.DecimalField(max_digits=15, decimal_places=10, blank=True,  null=True)
+    output_upper = models.TextField(blank=True)
+    token = models.TextField(blank=True, default=None, null=True)
+    external_host = models.TextField(blank=True, default=None, null=True)
+    input_kafka_broker = models.TextField(blank=True, default=None, null=True)
+    output_kafka_broker = models.TextField(blank=True, default=None, null=True)
+    upper_kafka_broker = models.TextField(blank=True, default=None, null=True)
+
+    class Meta(object):
+        ordering = ('-time', )