test /test_example_concept_learning_neural_evaluation.py removed for now

dice-group · Nov 11, 2024 · 882f512 · 882f512
1 parent 01eccb6
commit 882f512
Showing 1 changed file with 173 additions and 173 deletions.
diff --git a/tests/test_example_concept_learning_neural_evaluation.py b/tests/test_example_concept_learning_neural_evaluation.py
@@ -8,28 +8,28 @@
 
 """
 
-import json
-import time
-import os
-import subprocess
-import platform
-import pandas as pd
-from ontolearn.knowledge_base import KnowledgeBase
-from ontolearn.learners import CELOE, OCEL, Drill, TDL
-from ontolearn.concept_learner import EvoLearner, NCES, CLIP
-from ontolearn.refinement_operators import ExpressRefinement
-from ontolearn.learning_problem import PosNegLPStandard
-from ontolearn.metrics import F1
-from owlapy.owl_individual import OWLNamedIndividual, IRI
-import argparse
-from sklearn.model_selection import StratifiedKFold
-import numpy as np
-from ontolearn.utils.static_funcs import compute_f1_score
-from ontolearn.triple_store import TripleStore
-from ontolearn.owl_neural_reasoner import TripleStoreNeuralReasoner
-from owlapy import owl_expression_to_dl
-
-pd.set_option("display.precision", 5)
+# import json
+# import time
+# import os
+# import subprocess
+# import platform
+# import pandas as pd
+# from ontolearn.knowledge_base import KnowledgeBase
+# from ontolearn.learners import CELOE, OCEL, Drill, TDL
+# from ontolearn.concept_learner import EvoLearner, NCES, CLIP
+# from ontolearn.refinement_operators import ExpressRefinement
+# from ontolearn.learning_problem import PosNegLPStandard
+# from ontolearn.metrics import F1
+# from owlapy.owl_individual import OWLNamedIndividual, IRI
+# import argparse
+# from sklearn.model_selection import StratifiedKFold
+# import numpy as np
+# from ontolearn.utils.static_funcs import compute_f1_score
+# from ontolearn.triple_store import TripleStore
+# from ontolearn.owl_neural_reasoner import TripleStoreNeuralReasoner
+# from owlapy import owl_expression_to_dl
+
+# pd.set_option("display.precision", 5)
 
 """
 Regression Test for the example.
@@ -42,154 +42,154 @@
 python examples/concept_learning_evaluation.py --lps LPs/Family/lps.json --kb KGs/Family/family-benchmark_rich_background.owl --max_runtime 3 --report family.csv
 
 """
-import json
-import time
-import os
-import subprocess
-import platform
-import pandas as pd
-from ontolearn.knowledge_base import KnowledgeBase
-from ontolearn.learners import CELOE, OCEL, Drill, TDL
-from ontolearn.concept_learner import EvoLearner, NCES, CLIP
-from ontolearn.refinement_operators import ExpressRefinement
-from ontolearn.learning_problem import PosNegLPStandard
-from ontolearn.metrics import F1
-from owlapy.owl_individual import OWLNamedIndividual, IRI
-import argparse
-from sklearn.model_selection import StratifiedKFold
-import numpy as np
-from ontolearn.utils.static_funcs import compute_f1_score
-from ontolearn.triple_store import TripleStore
-from ontolearn.owl_neural_reasoner import TripleStoreNeuralReasoner
-from owlapy import owl_expression_to_dl
-
-pd.set_option("display.precision", 5)
-
-class TestConceptLearningCV:
-    def test_cv(self):
-
-        with open('LPs/Family/lps.json') as json_file:
-            settings = json.load(json_file)
-
-        path_kb="KGs/Family/family-benchmark_rich_background.owl"
-        max_runtime=1
-        random_seed=1
-        folds=2
-
-        from dicee.executer import Execute
-        from dicee.config import Namespace
-        args = Namespace()
-        args.model = 'Keci'
-        args.scoring_technique = "KvsAll"  # 1vsAll, or AllvsAll, or NegSample
-        args.path_single_kg = path_kb
-        args.path_to_store_single_run = "KeciFamilyRun"
-        args.backend="rdflib"
-        Execute(args).start()
-        path_kge=args.path_to_store_single_run
-
-        kb = KnowledgeBase(path=path_kb)
-        drill_with_symbolic_retriever = Drill(knowledge_base=kb,
-                                              quality_func=F1(), max_runtime=max_runtime,verbose=0)
-        neural_kb = TripleStore(reasoner=TripleStoreNeuralReasoner(path_neural_embedding=path_kge))
-        drill_with_neural_retriever = Drill(knowledge_base=neural_kb,
-                                            quality_func=F1(), max_runtime=max_runtime, verbose=0)
-
-        # dictionary to store the data
-        data = dict()
-        if "problems" in settings:
-            problems = settings["problems"].items()
-            positives_key = "positive_examples"
-            negatives_key = "negative_examples"
-        else:
-            problems = settings.items()
-            positives_key = "positive examples"
-            negatives_key = "negative examples"
-
-        for str_target_concept, examples in problems:
-            print("Target concept: ", str_target_concept)
-            p = examples[positives_key]
-            n = examples[negatives_key]
-
-            kf = StratifiedKFold(n_splits=folds, shuffle=True, random_state=random_seed)
-            X = np.array(p + n)
-            y = np.array([1.0 for _ in p] + [0.0 for _ in n])
-
-            for ith, (train_index, test_index) in enumerate(kf.split(X, y)):
-                #
-                data.setdefault("LP", []).append(str_target_concept)
-                data.setdefault("Fold", []).append(ith)
-                # () Extract positive and negative examples from train fold
-                train_pos = {pos_individual for pos_individual in X[train_index][y[train_index] == 1]}
-                train_neg = {neg_individual for neg_individual in X[train_index][y[train_index] == 0]}
-
-                # Sanity checking for individuals used for training.
-                assert train_pos.issubset(examples[positives_key])
-                assert train_neg.issubset(examples[negatives_key])
-
-                # () Extract positive and negative examples from test fold
-                test_pos = {pos_individual for pos_individual in X[test_index][y[test_index] == 1]}
-                test_neg = {neg_individual for neg_individual in X[test_index][y[test_index] == 0]}
-
-                # Sanity checking for individuals used for testing.
-                assert test_pos.issubset(examples[positives_key])
-                assert test_neg.issubset(examples[negatives_key])
-                train_lp = PosNegLPStandard(
-                    pos={OWLNamedIndividual(i) for i in train_pos},
-                    neg={OWLNamedIndividual(i) for i in train_neg})
-
-                test_lp = PosNegLPStandard(
-                    pos={OWLNamedIndividual(i) for i in test_pos},
-                    neg={OWLNamedIndividual(i) for i in test_neg})
-                print("DRILL Symbolic starts..", end=" ")
-                start_time = time.time()
-                # Prediction of DRILL through symbolic retriever.
-                pred_symbolic_drill = drill_with_symbolic_retriever.fit(train_lp).best_hypotheses()
-                symbolic_rt_drill = time.time() - start_time
-                print("DRILL Symbolic ends..", end="\t")
-                # Quality of prediction through symbolic retriever on the train split.
-                symbolic_train_f1_drill = compute_f1_score(
-                    individuals=frozenset({i for i in kb.individuals(pred_symbolic_drill)}),
-                    pos=train_lp.pos,
-                    neg=train_lp.neg)
-                # Quality of prediction through symbolic retriever on the test split.
-                symbolic_test_f1_drill = compute_f1_score(
-                    individuals=frozenset({i for i in kb.individuals(pred_symbolic_drill)}),
-                    pos=test_lp.pos,
-                    neg=test_lp.neg)
-                print(f"DRILL Symbolic Train Quality: {symbolic_train_f1_drill:.3f}", end="\t")
-                print(f"DRILL Symbolic Test Quality: {symbolic_test_f1_drill:.3f}", end="\t")
-                print(f"DRILL Symbolic Runtime: {symbolic_rt_drill:.3f}", end="\t")
-                print(f"Prediction: {owl_expression_to_dl(pred_symbolic_drill)}")
-                data.setdefault("Train-F1-Symbolic-DRILL", []).append(symbolic_train_f1_drill)
-                data.setdefault("Test-F1-Symbolic-DRILL", []).append(symbolic_test_f1_drill)
-                data.setdefault("RT-Symbolic-DRILL", []).append(symbolic_rt_drill)
-                data.setdefault("Prediction-Symbolic-DRILL", []).append(owl_expression_to_dl(pred_symbolic_drill))
-
-                print("DRILL Neural starts..", end=" ")
-                start_time = time.time()
-                # Prediction of DRILL through symbolic retriever.
-                pred_neural_drill = drill_with_neural_retriever.fit(train_lp).best_hypotheses()
-                neural_rt_drill = time.time() - start_time
-                print("DRILL Neural ends..", end="\t")
-                # Quality of prediction through symbolic retriever on the train split.
-                neural_train_f1_drill = compute_f1_score(
-                    individuals=frozenset({i for i in neural_kb.individuals(pred_neural_drill)}),
-                    pos=train_lp.pos,
-                    neg=train_lp.neg)
-                # Quality of prediction through symbolic retriever on the test split.
-                neural_test_f1_drill = compute_f1_score(
-                    individuals=frozenset({i for i in neural_kb.individuals(pred_neural_drill)}),
-                    pos=test_lp.pos,
-                    neg=test_lp.neg)
-                print(f"DRILL Neural Train Quality: {neural_train_f1_drill:.3f}", end="\t")
-                print(f"DRILL Neural Test Quality: {neural_test_f1_drill:.3f}", end="\t")
-                print(f"DRILL Neural Runtime: {neural_rt_drill:.3f}", end="\t")
-                print(f"Prediction: {owl_expression_to_dl(pred_neural_drill)}")
-
-                data.setdefault("Train-F1-Neural-DRILL", []).append(neural_train_f1_drill)
-                data.setdefault("Test-F1-Neural-DRILL", []).append(neural_test_f1_drill)
-                data.setdefault("RT-Neural-DRILL", []).append(neural_rt_drill)
-                data.setdefault("Prediction-Neural-DRILL", []).append(owl_expression_to_dl(pred_neural_drill))
-
-        df = pd.DataFrame.from_dict(data)
-        assert df.select_dtypes(include="number").mean()["Train-F1-Symbolic-DRILL"] >= 0.93
+# import json
+# import time
+# import os
+# import subprocess
+# import platform
+# import pandas as pd
+# from ontolearn.knowledge_base import KnowledgeBase
+# from ontolearn.learners import CELOE, OCEL, Drill, TDL
+# from ontolearn.concept_learner import EvoLearner, NCES, CLIP
+# from ontolearn.refinement_operators import ExpressRefinement
+# from ontolearn.learning_problem import PosNegLPStandard
+# from ontolearn.metrics import F1
+# from owlapy.owl_individual import OWLNamedIndividual, IRI
+# import argparse
+# from sklearn.model_selection import StratifiedKFold
+# import numpy as np
+# from ontolearn.utils.static_funcs import compute_f1_score
+# from ontolearn.triple_store import TripleStore
+# from ontolearn.owl_neural_reasoner import TripleStoreNeuralReasoner
+# from owlapy import owl_expression_to_dl
+
+# pd.set_option("display.precision", 5)
+
+# class TestConceptLearningCV:
+#     def test_cv(self):
+
+#         with open('LPs/Family/lps.json') as json_file:
+#             settings = json.load(json_file)
+
+#         path_kb="KGs/Family/family-benchmark_rich_background.owl"
+#         max_runtime=1
+#         random_seed=1
+#         folds=2
+
+#         from dicee.executer import Execute
+#         from dicee.config import Namespace
+#         args = Namespace()
+#         args.model = 'Keci'
+#         args.scoring_technique = "KvsAll"  # 1vsAll, or AllvsAll, or NegSample
+#         args.path_single_kg = path_kb
+#         args.path_to_store_single_run = "KeciFamilyRun"
+#         args.backend="rdflib"
+#         Execute(args).start()
+#         path_kge=args.path_to_store_single_run
+
+#         kb = KnowledgeBase(path=path_kb)
+#         drill_with_symbolic_retriever = Drill(knowledge_base=kb,
+#                                               quality_func=F1(), max_runtime=max_runtime,verbose=0)
+#         neural_kb = TripleStore(reasoner=TripleStoreNeuralReasoner(path_neural_embedding=path_kge))
+#         drill_with_neural_retriever = Drill(knowledge_base=neural_kb,
+#                                             quality_func=F1(), max_runtime=max_runtime, verbose=0)
+
+#         # dictionary to store the data
+#         data = dict()
+#         if "problems" in settings:
+#             problems = settings["problems"].items()
+#             positives_key = "positive_examples"
+#             negatives_key = "negative_examples"
+#         else:
+#             problems = settings.items()
+#             positives_key = "positive examples"
+#             negatives_key = "negative examples"
+
+#         for str_target_concept, examples in problems:
+#             print("Target concept: ", str_target_concept)
+#             p = examples[positives_key]
+#             n = examples[negatives_key]
+
+#             kf = StratifiedKFold(n_splits=folds, shuffle=True, random_state=random_seed)
+#             X = np.array(p + n)
+#             y = np.array([1.0 for _ in p] + [0.0 for _ in n])
+
+#             for ith, (train_index, test_index) in enumerate(kf.split(X, y)):
+#                 #
+#                 data.setdefault("LP", []).append(str_target_concept)
+#                 data.setdefault("Fold", []).append(ith)
+#                 # () Extract positive and negative examples from train fold
+#                 train_pos = {pos_individual for pos_individual in X[train_index][y[train_index] == 1]}
+#                 train_neg = {neg_individual for neg_individual in X[train_index][y[train_index] == 0]}
+
+#                 # Sanity checking for individuals used for training.
+#                 assert train_pos.issubset(examples[positives_key])
+#                 assert train_neg.issubset(examples[negatives_key])
+
+#                 # () Extract positive and negative examples from test fold
+#                 test_pos = {pos_individual for pos_individual in X[test_index][y[test_index] == 1]}
+#                 test_neg = {neg_individual for neg_individual in X[test_index][y[test_index] == 0]}
+
+#                 # Sanity checking for individuals used for testing.
+#                 assert test_pos.issubset(examples[positives_key])
+#                 assert test_neg.issubset(examples[negatives_key])
+#                 train_lp = PosNegLPStandard(
+#                     pos={OWLNamedIndividual(i) for i in train_pos},
+#                     neg={OWLNamedIndividual(i) for i in train_neg})
+
+#                 test_lp = PosNegLPStandard(
+#                     pos={OWLNamedIndividual(i) for i in test_pos},
+#                     neg={OWLNamedIndividual(i) for i in test_neg})
+#                 print("DRILL Symbolic starts..", end=" ")
+#                 start_time = time.time()
+#                 # Prediction of DRILL through symbolic retriever.
+#                 pred_symbolic_drill = drill_with_symbolic_retriever.fit(train_lp).best_hypotheses()
+#                 symbolic_rt_drill = time.time() - start_time
+#                 print("DRILL Symbolic ends..", end="\t")
+#                 # Quality of prediction through symbolic retriever on the train split.
+#                 symbolic_train_f1_drill = compute_f1_score(
+#                     individuals=frozenset({i for i in kb.individuals(pred_symbolic_drill)}),
+#                     pos=train_lp.pos,
+#                     neg=train_lp.neg)
+#                 # Quality of prediction through symbolic retriever on the test split.
+#                 symbolic_test_f1_drill = compute_f1_score(
+#                     individuals=frozenset({i for i in kb.individuals(pred_symbolic_drill)}),
+#                     pos=test_lp.pos,
+#                     neg=test_lp.neg)
+#                 print(f"DRILL Symbolic Train Quality: {symbolic_train_f1_drill:.3f}", end="\t")
+#                 print(f"DRILL Symbolic Test Quality: {symbolic_test_f1_drill:.3f}", end="\t")
+#                 print(f"DRILL Symbolic Runtime: {symbolic_rt_drill:.3f}", end="\t")
+#                 print(f"Prediction: {owl_expression_to_dl(pred_symbolic_drill)}")
+#                 data.setdefault("Train-F1-Symbolic-DRILL", []).append(symbolic_train_f1_drill)
+#                 data.setdefault("Test-F1-Symbolic-DRILL", []).append(symbolic_test_f1_drill)
+#                 data.setdefault("RT-Symbolic-DRILL", []).append(symbolic_rt_drill)
+#                 data.setdefault("Prediction-Symbolic-DRILL", []).append(owl_expression_to_dl(pred_symbolic_drill))
+
+#                 print("DRILL Neural starts..", end=" ")
+#                 start_time = time.time()
+#                 # Prediction of DRILL through symbolic retriever.
+#                 pred_neural_drill = drill_with_neural_retriever.fit(train_lp).best_hypotheses()
+#                 neural_rt_drill = time.time() - start_time
+#                 print("DRILL Neural ends..", end="\t")
+#                 # Quality of prediction through symbolic retriever on the train split.
+#                 neural_train_f1_drill = compute_f1_score(
+#                     individuals=frozenset({i for i in neural_kb.individuals(pred_neural_drill)}),
+#                     pos=train_lp.pos,
+#                     neg=train_lp.neg)
+#                 # Quality of prediction through symbolic retriever on the test split.
+#                 neural_test_f1_drill = compute_f1_score(
+#                     individuals=frozenset({i for i in neural_kb.individuals(pred_neural_drill)}),
+#                     pos=test_lp.pos,
+#                     neg=test_lp.neg)
+#                 print(f"DRILL Neural Train Quality: {neural_train_f1_drill:.3f}", end="\t")
+#                 print(f"DRILL Neural Test Quality: {neural_test_f1_drill:.3f}", end="\t")
+#                 print(f"DRILL Neural Runtime: {neural_rt_drill:.3f}", end="\t")
+#                 print(f"Prediction: {owl_expression_to_dl(pred_neural_drill)}")
+
+#                 data.setdefault("Train-F1-Neural-DRILL", []).append(neural_train_f1_drill)
+#                 data.setdefault("Test-F1-Neural-DRILL", []).append(neural_test_f1_drill)
+#                 data.setdefault("RT-Neural-DRILL", []).append(neural_rt_drill)
+#                 data.setdefault("Prediction-Neural-DRILL", []).append(owl_expression_to_dl(pred_neural_drill))
+
+#         df = pd.DataFrame.from_dict(data)
+#         assert df.select_dtypes(include="number").mean()["Train-F1-Symbolic-DRILL"] >= 0.93