5 жил өмнө · 970cb5c036
--- a/chillax/experiment_selfsupervised.py
+++ b/chillax/experiment_selfsupervised.py
@@ -26,7 +26,7 @@ def main():
 
															                 "augmentation": {},
														
 
															                 "trainer": {
														
 
															                     "name": "fast_single_shot",
														
 
															-                    "batch_size": 8,
														
 
															+                    "batch_size": 2,
														
 
															                     "inner_steps": 2000,
														
 
															                 },
														
 
															                 "feature_extractor": {"side_length": 448},
														
@@ -47,12 +47,19 @@ def main():
 
															     experiment_container = containers.ExperimentContainer(
														
 
															         config, observers=(CheapObserver(),)
														
 
															     )
														
 
															-    experiment_container.knowledge_base.observe_concepts(
														
 
															-        experiment_container.dataset.observable_concepts()
														
 
															-    )
														
 
															     dataset = experiment_container.dataset
														
 
															+    # Get prediction targets
														
 
															+    experiment_container.knowledge_base.add_prediction_targets(
														
 
															+        dataset.prediction_targets()
														
 
															+    )
														
 
															+
														
 
															+    # Add relation source
														
 
															+    experiment_container.knowledge_base.add_hyponymy_relation([dataset.get_hyponymy_relation_source()])
														
 
															+
														
 
															+    exit
														
 
															+
														
 
															     base_model = experiment_container.base_model
														
 
															     training_samples = dataset.train_pool(0, "label_gt")
														
 
															     base_model.observe(training_samples, "label_gt")
														
--- a/chillax/method.py
+++ b/chillax/method.py
@@ -1,5 +1,5 @@
 
															 from chia.v2.components.classifiers import keras_hierarchicalclassification
														
 
															-from chia.v2 import instrumentation
														
 
															+from chia.v2 import instrumentation, knowledge
														
 
															 import networkx as nx
														
 
															 import numpy as np
														
@@ -41,7 +41,7 @@ class CHILLAXKerasHC(
 
															         self.fc_layer = None
														
 
															         self.uid_to_dimension = {}
														
 
															         self.graph = None
														
 
															-        self.observed_uids = None
														
 
															+        self.prediction_target_uids = None
														
 
															         self.topo_sorted_uids = None
														
 
															         self.loss_weights = None
														
 
															         self.update_embedding()
														
@@ -107,7 +107,7 @@ class CHILLAXKerasHC(
 
															             if self._mlnp:
														
 
															                 for i, (uid, p) in enumerate(sorted_tuples):
														
 
															-                    if uid not in self.observed_uids:
														
 
															+                    if uid not in self.prediction_target_uids:
														
 
															                         sorted_tuples[i] = (uid, 0.0)
														
 
															             if self._normalize_scores:
														
@@ -117,12 +117,12 @@ class CHILLAXKerasHC(
 
															             return list(sorted_tuples)
														
 
															     def update_embedding(self):
														
 
															-        current_concepts = self.kb.all_concepts.values()
														
 
															+        current_concepts = self.kb.concepts()
														
 
															         current_concept_count = len(current_concepts)
														
 
															         self.report_metric("current_concepts", current_concept_count)
														
 
															         if current_concept_count == 0:
														
 
															-            return
														
 
															+            return True
														
 
															         try:
														
 
															             old_weights = self.fc_layer.get_weights()
														
@@ -146,20 +146,22 @@ class CHILLAXKerasHC(
 
															             bias_initializer="zero",
														
 
															         )
														
 
															-        # We need to reverse the graph for comfort because "is-a" has the concepts
														
 
															-        self.graph = self.kb.all_relations["hypernymy"]["graph"].reverse(copy=True)
														
 
															+        try:
														
 
															+            self.graph = self.kb.get_hyponymy_relation_rgraph()
														
 
															+        except ValueError:
														
 
															+            return False
														
 
															         # Memorize topological sorting for later
														
 
															         all_uids = nx.topological_sort(self.graph)
														
 
															         self.topo_sorted_uids = list(all_uids)
														
 
															-        assert len(self.kb.all_concepts) == len(self.topo_sorted_uids)
														
 
															+        assert len(current_concepts) == len(self.topo_sorted_uids)
														
 
															         self.uid_to_dimension = {
														
 
															             uid: dimension for dimension, uid in enumerate(self.topo_sorted_uids)
														
 
															         }
														
 
															-        self.observed_uids = {
														
 
															-            concept.data["uid"] for concept in self.kb.get_observed_concepts()
														
 
															+        self.prediction_target_uids = {
														
 
															+            concept.uid for concept in self.kb.concepts(flags={knowledge.ConceptFlagV2.PREDICTION_TARGET})
														
 
															         }
														
 
															         if len(old_weights) == 2:
														
@@ -189,9 +191,10 @@ class CHILLAXKerasHC(
 
															             self.fc_layer.set_weights([new_weights, new_biases])
														
 
															         self.update_loss_weights()
														
 
															+        return True
														
 
															     def update_loss_weights(self):
														
 
															-        if len(self.observed_uids) == 0:
														
 
															+        if len(self.prediction_target_uids) == 0:
														
 
															             self.log_debug("Skipping loss weight update, no concepts found.")
														
 
															             self.loss_weights = []
														
 
															             return
														
@@ -204,7 +207,7 @@ class CHILLAXKerasHC(
 
															         # (1) Calculate "natural" weights by assuming uniform distribution
														
 
															         # over observed concepts
														
 
															         occurences = {uid: 0 for uid in self.topo_sorted_uids}
														
 
															-        for uid in self.observed_uids:
														
 
															+        for uid in self.prediction_target_uids:
														
 
															             affected_uids = {uid}
														
 
															             affected_uids |= nx.ancestors(self.graph, uid)
														
 
															             for affected_uid in list(affected_uids):
														
@@ -254,7 +257,7 @@ class CHILLAXKerasHC(
 
															                 for i, uid in enumerate(self.uid_to_dimension):
														
 
															                     descendants = set(nx.descendants(self.graph, uid)) | {uid}
														
 
															-                    reachable_leaf_nodes = descendants.intersection(self.observed_uids)
														
 
															+                    reachable_leaf_nodes = descendants.intersection(self.prediction_target_uids)
														
 
															                     self.loss_weights[i] *= len(reachable_leaf_nodes)
														
 
															                     # Test if any leaf nodes are reachable
														
@@ -289,6 +292,10 @@ class CHILLAXKerasHC(
 
															         self.loss_weights /= gain
														
 
															     def loss(self, feature_batch, ground_truth):
														
 
															+        if not self.is_updated:
														
 
															+            raise RuntimeError("This classifier is not yet ready to compute a loss. "
														
 
															+                               "Check if it has been notified of a hyponymy relation.")
														
 
															+
														
 
															         loss_mask = np.zeros((len(ground_truth), len(self.uid_to_dimension)))
														
 
															         for i, label in enumerate(ground_truth):
														
 
															             # Loss mask
														
@@ -326,9 +333,7 @@ class CHILLAXKerasHC(
 
															         return tf.reduce_mean(sum_per_batch_element)
														
 
															     def observe(self, samples, gt_resource_id):
														
 
															-        if self.kb.get_concept_stamp() != self.last_observed_concept_stamp:
														
 
															-            self.update_embedding()
														
 
															-            self.last_observed_concept_stamp = self.kb.get_concept_stamp()
														
 
															+        self.maybe_update_embedding()
														
 
															     def regularization_losses(self):
														
 
															         return self.fc_layer.losses