
Commit 506df8a

Commit message: update
1 parent ade0a06 commit 506df8a

14 files changed: +241 -76 lines

deepcluster/earlystopping.py

+82
@@ -0,0 +1,82 @@
from typing import List
import copy
import operator
from enum import Enum, auto
import numpy as np

from torch.nn import Module


class StopVariable(Enum):
    LOSS = auto()
    ACCURACY = auto()
    NONE = auto()


class Best(Enum):
    RANKED = auto()
    ALL = auto()

# , StopVariable.LOSS
stopping_args = dict(
    stop_varnames=[StopVariable.ACCURACY],
    patience=100, max_epochs=1000, remember=Best.RANKED)


class EarlyStopping:
    def __init__(
            self, model: Module, stop_varnames: List[StopVariable],
            patience: int = 100, max_epochs: int = 1000, remember: Best = Best.RANKED):
        self.model = model
        self.comp_ops = []
        self.stop_vars = []
        self.best_vals = []
        for stop_varname in stop_varnames:
            if stop_varname is StopVariable.LOSS:
                self.stop_vars.append('loss')
                self.comp_ops.append(operator.le)
                self.best_vals.append(np.inf)
            elif stop_varname is StopVariable.ACCURACY:
                self.stop_vars.append('acc')
                self.comp_ops.append(operator.ge)
                self.best_vals.append(-np.inf)
        self.remember = remember
        self.remembered_vals = copy.copy(self.best_vals)
        self.max_patience = patience
        self.patience = self.max_patience
        self.max_epochs = max_epochs
        self.best_epoch = None
        self.best_state = None

    def check(self, values: List[np.floating], epoch: int) -> bool:
        checks = [self.comp_ops[i](val, self.best_vals[i])
                  for i, val in enumerate(values)]
        if any(checks):
            self.best_vals = np.choose(checks, [self.best_vals, values])
            self.patience = self.max_patience

            comp_remembered = [
                self.comp_ops[i](val, self.remembered_vals[i])
                for i, val in enumerate(values)]
            if self.remember is Best.ALL:
                if all(comp_remembered):
                    self.best_epoch = epoch
                    self.remembered_vals = copy.copy(values)
                    self.best_state = {
                        key: value.cpu() for key, value
                        in self.model.state_dict().items()}
            elif self.remember is Best.RANKED:
                for i, comp in enumerate(comp_remembered):
                    if comp:
                        if not(self.remembered_vals[i] == values[i]):
                            self.best_epoch = epoch
                            self.remembered_vals = copy.copy(values)
                            self.best_state = {
                                key: value.cpu() for key, value
                                in self.model.state_dict().items()}
                            break
                    else:
                        break
        else:
            self.patience -= 1
        return self.patience == 0
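For reference, a small self-contained sketch of how the class above is driven; the toy model and the made-up metric history are illustrative only, not part of this commit:

    import torch.nn as nn
    from earlystopping import EarlyStopping, StopVariable, Best  # with deepcluster/ on sys.path

    model = nn.Linear(4, 2)  # toy stand-in for the real network
    es = EarlyStopping(model, stop_varnames=[StopVariable.ACCURACY, StopVariable.LOSS],
                       patience=2, max_epochs=50, remember=Best.RANKED)

    # (accuracy, loss) per epoch; values passed to check() must follow the order of stop_varnames
    history = [(0.60, 1.00), (0.70, 0.80), (0.70, 0.85), (0.69, 0.90), (0.68, 0.95)]
    for epoch, (acc, loss) in enumerate(history):
        if es.check([acc, loss], epoch):
            print('stopped at epoch', epoch)  # patience (2) runs out after two epochs with no improvement
            break

    print(es.best_epoch, es.remembered_vals)  # 1 [0.7, 0.8]; es.best_state holds that epoch's weights

Patience is reset whenever any tracked variable matches or beats its best value so far and decremented otherwise; once it reaches zero, check() returns True, and the remembered weights can be restored with model.load_state_dict(es.best_state).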

not_in_use/.DS_Store

8 KB
Binary file not shown.

semi/01p/main_echogram_semi_3classes.py renamed to not_in_use/semi_01p/main_echogram_semi_3classes.py

+1 -1
@@ -25,7 +25,7 @@
 import matplotlib.pyplot as plt
 
 current_dir = os.getcwd()
-sys.path.append(os.path.join(current_dir, '..', '..', 'deepcluster'))
+sys.path.append(os.path.join(current_dir, '../../semi', '..', 'deepcluster'))
 
 import paths
 import clustering

semi/20p/main_echogram_semi_3classes.py renamed to not_in_use/semi_20p/main_echogram_semi_3classes.py

+1 -1
@@ -25,7 +25,7 @@
 import matplotlib.pyplot as plt
 
 current_dir = os.getcwd()
-sys.path.append(os.path.join(current_dir, '..', '..', 'deepcluster'))
+sys.path.append(os.path.join(current_dir, '../../semi', '..', 'deepcluster'))
 
 import paths
 import clustering
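Note on the edited sys.path line in both renamed scripts: the new argument list is written differently, but for any given working directory it normalizes (lexically, ignoring symlinks) to the same deepcluster directory as before. A quick check with a hypothetical working directory; the '/repo/...' path is illustrative only:

    import os

    current_dir = '/repo/not_in_use/semi_01p'  # hypothetical value of os.getcwd()
    old = os.path.join(current_dir, '..', '..', 'deepcluster')
    new = os.path.join(current_dir, '../../semi', '..', 'deepcluster')

    print(os.path.normpath(old))  # /repo/deepcluster
    print(os.path.normpath(new))  # /repo/deepcluster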

semi/.DS_Store

0 Bytes
Binary file not shown.

semi/02p/main_echogram_semi_3classes.py

+157 -74
@@ -46,6 +46,7 @@
 from batch.data_transform_functions.db_with_limits import db_with_limits_img
 from batch.combine_functions import CombineFunctions
 from classifier_linearSVC import SimpleClassifier
+from earlystopping import EarlyStopping, stopping_args
 
 def parse_args():
     current_dir = os.getcwd()
@@ -357,6 +358,75 @@ def sampling_echograms_test(args):
 
     return dataset_test_bal, dataset_test_unbal
 
+def produce_test_result_bal(epoch, model, dataloader_test_bal, dataset_test_bal, device, args, deepcluster):
+    model.classifier = nn.Sequential(*list(model.classifier.children())[:-1])  # remove ReLU at classifier [:-1]
+    model.cluster_layer = None
+    model.category_layer = None
+
+    print('TEST set: Cluster the features')
+    features_te_bal, input_tensors_te_bal, labels_te_bal = compute_features(dataloader_test_bal, model, len(dataset_test_bal),
+                                            device=device, args=args)
+    clustering_loss_te_bal, pca_features_te_bal = deepcluster.cluster(features_te_bal, verbose=args.verbose)
+
+    mlp = list(model.classifier.children())  # classifier that ends with linear(512 * 128). No ReLU at the end
+    mlp.append(nn.ReLU(inplace=True).to(device))
+    model.classifier = nn.Sequential(*mlp)
+    model.classifier.to(device)
+
+    # nan_location_bal = np.isnan(pca_features_te_bal)
+    # inf_location_bal = np.isinf(pca_features_te_bal)
+    # if (not np.allclose(nan_location_bal, 0)) or (not np.allclose(inf_location_bal, 0)):
+    #     print('PCA: Feature NaN or Inf found. Nan count: ', np.sum(nan_location_bal), ' Inf count: ',
+    #           np.sum(inf_location_bal))
+    #     print('Skip epoch ', epoch)
+    #     torch.save(pca_features_te_bal, 'te_pca_NaN_%d_bal.pth.tar' % epoch)
+    #     torch.save(features_te_bal, 'te_feature_NaN_%d_bal.pth.tar' % epoch)
+    #     continue
+
+    # save patches per epochs
+    cp_epoch_out_bal = [features_te_bal, deepcluster.images_lists, deepcluster.images_dist_lists, input_tensors_te_bal,
+                        labels_te_bal]
+    with open(os.path.join(args.exp, 'bal', 'features', 'cp_epoch_%d_te_bal.pickle' % epoch), "wb") as f:
+        pickle.dump(cp_epoch_out_bal, f)
+    with open(os.path.join(args.exp, 'bal', 'pca_features', 'pca_epoch_%d_te_bal.pickle' % epoch), "wb") as f:
+        pickle.dump(pca_features_te_bal, f)
+    return 0
+
+def produce_test_result_unbal(epoch, model, dataloader_test_unbal, dataset_test_unbal, device, args, deepcluster):
+    model.classifier = nn.Sequential(*list(model.classifier.children())[:-1])  # remove ReLU at classifier [:-1]
+    model.cluster_layer = None
+    model.category_layer = None
+
+    print('TEST set: Cluster the features')
+    features_te_unbal, input_tensors_te_unbal, labels_te_unbal = compute_features(dataloader_test_unbal, model, len(dataset_test_unbal),
+                                            device=device, args=args)
+    clustering_loss_te_unbal, pca_features_te_unbal = deepcluster.cluster(features_te_unbal, verbose=args.verbose)
+
+    mlp = list(model.classifier.children())  # classifier that ends with linear(512 * 128). No ReLU at the end
+    mlp.append(nn.ReLU(inplace=True).to(device))
+    model.classifier = nn.Sequential(*mlp)
+    model.classifier.to(device)
+
+    # nan_location_unbal = np.isnan(pca_features_te_unbal)
+    # inf_location_unbal = np.isinf(pca_features_te_unbal)
+    # if (not np.allclose(nan_location_unbal, 0)) or (not np.allclose(inf_location_unbal, 0)):
+    #     print('PCA: Feature NaN or Inf found. Nan count: ', np.sum(nan_location_unbal), ' Inf count: ',
+    #           np.sum(inf_location_unbal))
+    #     print('Skip epoch ', epoch)
+    #     torch.save(pca_features_te_unbal, 'te_pca_NaN_%d_unbal.pth.tar' % epoch)
+    #     torch.save(features_te_unbal, 'te_feature_NaN_%d_unbal.pth.tar' % epoch)
+    #     continue
+
+    # save patches per epochs
+    cp_epoch_out_unbal = [features_te_unbal, deepcluster.images_lists, deepcluster.images_dist_lists, input_tensors_te_unbal,
+                          labels_te_unbal]
+
+    with open(os.path.join(args.exp, 'unbal', 'features', 'cp_epoch_%d_te_unbal.pickle' % epoch), "wb") as f:
+        pickle.dump(cp_epoch_out_unbal, f)
+    with open(os.path.join(args.exp, 'unbal', 'pca_features', 'pca_epoch_%d_te_unbal.pickle' % epoch), "wb") as f:
+        pickle.dump(pca_features_te_unbal, f)
+    return 0
+
 def main(args):
     # fix random seeds
     torch.manual_seed(args.seed)
@@ -418,6 +488,16 @@ def main(args):
     model.category_layer = model.category_layer.double()
     model.category_layer.to(device)
 
+    '''
+    ############################
+    ############################
+    # EarlyStopping (test_accuracy_bal, 100)
+    ############################
+    ############################
+    '''
+    early_stopping = EarlyStopping(model, **stopping_args)
+    stop_vars = []
+
     if args.optimizer is 'Adam':
         print('Adam optimizer: conv')
         optimizer_category = torch.optim.Adam(
@@ -531,7 +611,7 @@ def main(args):
     MAIN TRAINING
     #######################
     #######################'''
-    for epoch in range(args.start_epoch, args.epochs):
+    for epoch in range(args.start_epoch, early_stopping.max_epochs):
         end = time.time()
         print('##################### Start training at Epoch %d ################'% epoch)
         model.classifier = nn.Sequential(*list(model.classifier.children())[:-1])  # remove ReLU at classifier [:-1]
@@ -693,92 +773,95 @@ def main(args):
         with open(os.path.join(args.exp, 'loss_collect.pickle'), "wb") as f:
             pickle.dump(loss_collect, f)
 
-        '''
-        ############################
-        ############################
-        # PSEUDO-LABEL GEN: Test set (balanced UA)
-        ############################
-        ############################
-        '''
-        model.classifier = nn.Sequential(*list(model.classifier.children())[:-1])  # remove ReLU at classifier [:-1]
-        model.cluster_layer = None
-        model.category_layer = None
-
-        print('TEST set: Cluster the features')
-        features_te_bal, input_tensors_te_bal, labels_te_bal = compute_features(dataloader_test_bal, model, len(dataset_test_bal),
-                                                device=device, args=args)
-        clustering_loss_te_bal, pca_features_te_bal = deepcluster.cluster(features_te_bal, verbose=args.verbose)
-
-        mlp = list(model.classifier.children())  # classifier that ends with linear(512 * 128). No ReLU at the end
-        mlp.append(nn.ReLU(inplace=True).to(device))
-        model.classifier = nn.Sequential(*mlp)
-        model.classifier.to(device)
-
-        nan_location_bal = np.isnan(pca_features_te_bal)
-        inf_location_bal = np.isinf(pca_features_te_bal)
-        if (not np.allclose(nan_location_bal, 0)) or (not np.allclose(inf_location_bal, 0)):
-            print('PCA: Feature NaN or Inf found. Nan count: ', np.sum(nan_location_bal), ' Inf count: ',
-                  np.sum(inf_location_bal))
-            print('Skip epoch ', epoch)
-            torch.save(pca_features_te_bal, 'te_pca_NaN_%d_bal.pth.tar' % epoch)
-            torch.save(features_te_bal, 'te_feature_NaN_%d_bal.pth.tar' % epoch)
-            continue
-
-        # save patches per epochs
-        cp_epoch_out_bal = [features_te_bal, deepcluster.images_lists, deepcluster.images_dist_lists, input_tensors_te_bal,
-                            labels_te_bal]
+        if (epoch % args.save_epoch == 0):
+            out = produce_test_result_bal(epoch, model, dataloader_test_bal, dataset_test_bal, device, args, deepcluster)
+            out = produce_test_result_unbal(epoch, model, dataloader_test_unbal, dataset_test_unbal, device, args, deepcluster)
 
+        '''EarlyStopping'''
+        if early_stopping.check(loss_collect[7], epoch):
+            break
 
-        if (epoch % args.save_epoch == 0):
-            with open(os.path.join(args.exp, 'bal', 'features', 'cp_epoch_%d_te_bal.pickle' % epoch), "wb") as f:
-                pickle.dump(cp_epoch_out_bal, f)
-            with open(os.path.join(args.exp, 'bal', 'pca_features', 'pca_epoch_%d_te_bal.pickle' % epoch), "wb") as f:
-                pickle.dump(pca_features_te_bal, f)
+        out = produce_test_result_bal(epoch, model, dataloader_test_bal, dataset_test_bal, device, args, deepcluster)
+        out = produce_test_result_unbal(epoch, model, dataloader_test_unbal, dataset_test_unbal, device, args,
+                                        deepcluster)
 
 
         '''
         ############################
         ############################
-        # PSEUDO-LABEL GEN: Test set (Unbalanced UA)
+        # PSEUDO-LABEL GEN: Test set (balanced UA)
         ############################
         ############################
         '''
-        model.classifier = nn.Sequential(*list(model.classifier.children())[:-1])  # remove ReLU at classifier [:-1]
-        model.cluster_layer = None
-        model.category_layer = None
-
-        print('TEST set: Cluster the features')
-        features_te_unbal, input_tensors_te_unbal, labels_te_unbal = compute_features(dataloader_test_unbal, model, len(dataset_test_unbal),
-                                                device=device, args=args)
-        clustering_loss_te_unbal, pca_features_te_unbal = deepcluster.cluster(features_te_unbal, verbose=args.verbose)
-
-        mlp = list(model.classifier.children())  # classifier that ends with linear(512 * 128). No ReLU at the end
-        mlp.append(nn.ReLU(inplace=True).to(device))
-        model.classifier = nn.Sequential(*mlp)
-        model.classifier.to(device)
-
-        nan_location_unbal = np.isnan(pca_features_te_unbal)
-        inf_location_unbal = np.isinf(pca_features_te_unbal)
-        if (not np.allclose(nan_location_unbal, 0)) or (not np.allclose(inf_location_unbal, 0)):
-            print('PCA: Feature NaN or Inf found. Nan count: ', np.sum(nan_location_unbal), ' Inf count: ',
-                  np.sum(inf_location_unbal))
-            print('Skip epoch ', epoch)
-            torch.save(pca_features_te_unbal, 'te_pca_NaN_%d_unbal.pth.tar' % epoch)
-            torch.save(features_te_unbal, 'te_feature_NaN_%d_unbal.pth.tar' % epoch)
-            continue
-
-        # save patches per epochs
-        cp_epoch_out_unbal = [features_te_unbal, deepcluster.images_lists, deepcluster.images_dist_lists, input_tensors_te_unbal,
-                              labels_te_unbal]
 
+def produce_test_result_bal(epoch, model, dataloader_test_bal, dataset_test_bal, device, args, deepcluster):
+    model.classifier = nn.Sequential(*list(model.classifier.children())[:-1])  # remove ReLU at classifier [:-1]
+    model.cluster_layer = None
+    model.category_layer = None
 
-        if (epoch % args.save_epoch == 0):
-            with open(os.path.join(args.exp, 'unbal', 'features', 'cp_epoch_%d_te_unbal.pickle' % epoch), "wb") as f:
-                pickle.dump(cp_epoch_out_unbal, f)
-            with open(os.path.join(args.exp, 'unbal', 'pca_features', 'pca_epoch_%d_te_unbal.pickle' % epoch), "wb") as f:
-                pickle.dump(pca_features_te_unbal, f)
-
+    print('TEST set: Cluster the features')
+    features_te_bal, input_tensors_te_bal, labels_te_bal = compute_features(dataloader_test_bal, model, len(dataset_test_bal),
+                                            device=device, args=args)
+    clustering_loss_te_bal, pca_features_te_bal = deepcluster.cluster(features_te_bal, verbose=args.verbose)
+
+    mlp = list(model.classifier.children())  # classifier that ends with linear(512 * 128). No ReLU at the end
+    mlp.append(nn.ReLU(inplace=True).to(device))
+    model.classifier = nn.Sequential(*mlp)
+    model.classifier.to(device)
+
+    # nan_location_bal = np.isnan(pca_features_te_bal)
+    # inf_location_bal = np.isinf(pca_features_te_bal)
+    # if (not np.allclose(nan_location_bal, 0)) or (not np.allclose(inf_location_bal, 0)):
+    #     print('PCA: Feature NaN or Inf found. Nan count: ', np.sum(nan_location_bal), ' Inf count: ',
+    #           np.sum(inf_location_bal))
+    #     print('Skip epoch ', epoch)
+    #     torch.save(pca_features_te_bal, 'te_pca_NaN_%d_bal.pth.tar' % epoch)
+    #     torch.save(features_te_bal, 'te_feature_NaN_%d_bal.pth.tar' % epoch)
+    #     continue
+
+    # save patches per epochs
+    cp_epoch_out_bal = [features_te_bal, deepcluster.images_lists, deepcluster.images_dist_lists, input_tensors_te_bal,
+                        labels_te_bal]
+    with open(os.path.join(args.exp, 'bal', 'features', 'cp_epoch_%d_te_bal.pickle' % epoch), "wb") as f:
+        pickle.dump(cp_epoch_out_bal, f)
+    with open(os.path.join(args.exp, 'bal', 'pca_features', 'pca_epoch_%d_te_bal.pickle' % epoch), "wb") as f:
+        pickle.dump(pca_features_te_bal, f)
+    return 0
+
+def produce_test_result_unbal(epoch, model, dataloader_test_unbal, dataset_test_unbal, device, args, deepcluster):
+    model.classifier = nn.Sequential(*list(model.classifier.children())[:-1])  # remove ReLU at classifier [:-1]
+    model.cluster_layer = None
+    model.category_layer = None
 
+    print('TEST set: Cluster the features')
+    features_te_unbal, input_tensors_te_unbal, labels_te_unbal = compute_features(dataloader_test_unbal, model, len(dataset_test_unbal),
+                                            device=device, args=args)
+    clustering_loss_te_unbal, pca_features_te_unbal = deepcluster.cluster(features_te_unbal, verbose=args.verbose)
+
+    mlp = list(model.classifier.children())  # classifier that ends with linear(512 * 128). No ReLU at the end
+    mlp.append(nn.ReLU(inplace=True).to(device))
+    model.classifier = nn.Sequential(*mlp)
+    model.classifier.to(device)
+
+    # nan_location_unbal = np.isnan(pca_features_te_unbal)
+    # inf_location_unbal = np.isinf(pca_features_te_unbal)
+    # if (not np.allclose(nan_location_unbal, 0)) or (not np.allclose(inf_location_unbal, 0)):
+    #     print('PCA: Feature NaN or Inf found. Nan count: ', np.sum(nan_location_unbal), ' Inf count: ',
+    #           np.sum(inf_location_unbal))
+    #     print('Skip epoch ', epoch)
+    #     torch.save(pca_features_te_unbal, 'te_pca_NaN_%d_unbal.pth.tar' % epoch)
+    #     torch.save(features_te_unbal, 'te_feature_NaN_%d_unbal.pth.tar' % epoch)
+    #     continue
+
+    # save patches per epochs
+    cp_epoch_out_unbal = [features_te_unbal, deepcluster.images_lists, deepcluster.images_dist_lists, input_tensors_te_unbal,
+                          labels_te_unbal]
+
+    with open(os.path.join(args.exp, 'unbal', 'features', 'cp_epoch_%d_te_unbal.pickle' % epoch), "wb") as f:
+        pickle.dump(cp_epoch_out_unbal, f)
+    with open(os.path.join(args.exp, 'unbal', 'pca_features', 'pca_epoch_%d_te_unbal.pickle' % epoch), "wb") as f:
+        pickle.dump(pca_features_te_unbal, f)
+    return 0
 
 if __name__ == '__main__':
     args = parse_args()
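The changes to main() above boil down to this control flow: loop up to early_stopping.max_epochs, dump the test-set clustering every args.save_epoch epochs, stop when patience runs out, and dump once more after the loop. Below is a toy reduction of that pattern; the dummy model, random metric, and no-op save step stand in for the script's real training code, the produce_test_result_bal/_unbal calls, and the loss_collect bookkeeping (loss_collect[7] is assumed to carry the tracked test accuracy):

    import torch
    import torch.nn as nn
    from earlystopping import EarlyStopping, stopping_args  # with deepcluster/ on sys.path

    model = nn.Linear(8, 3)      # placeholder for the real network
    early_stopping = EarlyStopping(model, **stopping_args)
    save_epoch = 10              # stands in for args.save_epoch

    def save_test_results(epoch):
        pass                     # stands in for produce_test_result_bal / produce_test_result_unbal

    for epoch in range(early_stopping.max_epochs):
        test_acc_bal = float(torch.rand(1))  # stands in for the tracked test accuracy

        if epoch % save_epoch == 0:          # periodic feature/PCA dumps
            save_test_results(epoch)

        # one value per entry in stopping_args['stop_varnames'] (accuracy only, by default)
        if early_stopping.check([test_acc_bal], epoch):
            break

    save_test_results(epoch)                 # one final dump after the loop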

sup/.DS_Store

0 Bytes
Binary file not shown.

supclust/.DS_Store

0 Bytes
Binary file not shown.

unbalsemi/.DS_Store

0 Bytes
Binary file not shown.
