fix building extensions

Techtonique · Apr 25, 2024 · 04eddae · 04eddae
1 parent b2276fc
commit 04eddae
Show file tree

Hide file tree

Showing 17 changed files with 754 additions and 646 deletions.
diff --git a/CHANGES.md b/CHANGES.md
@@ -1,4 +1,4 @@
-# version 0.13.0
+# version 0.13.1
 
 - add clustering to `LSBoostRegressor`, `LSBoostClassifier`, and `AdaOpt`
 

diff --git a/Makefile b/Makefile
@@ -87,7 +87,7 @@ dist: clean ## builds source and wheel package
 	ls -l dist
 
 install: clean ## install the package to the active Python's site-packages
-	python3 -m pip install .
+	python3 -m pip install . --verbose
 
 run-examples: ## run all examples with one command
 	find examples -maxdepth 2 -name "*.py" -exec  python3 {} \;
diff --git a/examples/lsboost_regressor_pi.py b/examples/lsboost_regressor_pi.py
@@ -4,6 +4,9 @@
 
 print(f"\n ----- Running: {os.path.basename(__file__)}... ----- \n")
 
+print(os.path.dirname(
+    os.path.abspath(__file__)
+    ))
 
 subprocess.check_call([sys.executable, "-m", "pip", "install", "matplotlib"])
 

diff --git a/mlsauce/adaopt/_adaopt.py b/mlsauce/adaopt/_adaopt.py
@@ -7,13 +7,15 @@
 from numpy.linalg import norm
 from tqdm import tqdm
 from ..utils import subsample
-from ..utils import cluster 
+from ..utils import cluster
 
 try:
     from . import _adaoptc as adaoptc
 except ImportError:
-    pass
+    import pyximport
 
+    pyximport.install()
+    import _adaoptc as adaoptc
 
 class AdaOpt(BaseEstimator, ClassifierMixin):
     """AdaOpt classifier.
@@ -72,15 +74,15 @@ class AdaOpt(BaseEstimator, ClassifierMixin):
         cache: boolean
             if the nearest neighbors are cached or not, for faster retrieval in
             subsequent calls.
-        
+
         n_clusters_input: int
             number of clusters (a priori) for clustering the features
-        
+
         clustering_method: str
             clustering method: currently 'kmeans', 'gmm'
-        
+
         cluster_scaling: str
-            scaling method for clustering: currently 'standard', 'robust', 'minmax'    
+            scaling method for clustering: currently 'standard', 'robust', 'minmax'
 
         seed: int
             reproducibility seed for nodes_sim=='uniform', clustering and dropout.
@@ -104,12 +106,12 @@ def __init__(
         n_jobs=None,
         verbose=0,
         cache=True,
-        n_clusters_input = 0,
-        clustering_method = "kmeans",
-        cluster_scaling = "standard",
+        n_clusters_input=0,
+        clustering_method="kmeans",
+        cluster_scaling="standard",
         seed=123,
     ):
-        if n_clusters_input > 0: 
+        if n_clusters_input > 0:
             assert clustering_method in (
                 "kmeans",
                 "gmm",
@@ -145,7 +147,7 @@ def __init__(
         self.n_clusters_input = n_clusters_input
         self.clustering_method = clustering_method
         self.cluster_scaling = cluster_scaling
-        self.scaler_, self.label_encoder_, self.clusterer_ = None, None, None 
+        self.scaler_, self.label_encoder_, self.clusterer_ = None, None, None
         self.seed = seed
 
     def fit(self, X, y, **kwargs):
@@ -168,12 +170,17 @@ def fit(self, X, y, **kwargs):
 
         """
 
-        if self.n_clusters_input > 0: 
-            clustered_X, self.scaler_, self.label_encoder_, self.clusterer_ = cluster(X, n_clusters=self.n_clusters_input, 
-                method=self.clustering_method, 
-                type_scaling=self.cluster_scaling,
-                training=True, 
-                seed=self.seed)
+        if self.n_clusters_input > 0:
+            clustered_X, self.scaler_, self.label_encoder_, self.clusterer_ = (
+                cluster(
+                    X,
+                    n_clusters=self.n_clusters_input,
+                    method=self.clustering_method,
+                    type_scaling=self.cluster_scaling,
+                    training=True,
+                    seed=self.seed,
+                )
+            )
             X = np.column_stack((X.copy(), clustered_X))
 
         if self.row_sample < 1:
@@ -212,7 +219,7 @@ def fit(self, X, y, **kwargs):
         self.alphas = res["alphas"]
         self.n_iterations = res["n_iterations"]
         self.scaled_X_train = np.array(res["scaled_X_train"], dtype=np.float64)
-        self.n_classes_ = len(np.unique(y)) # for compatibility with sklearn 
+        self.n_classes_ = len(np.unique(y))  # for compatibility with sklearn
         return self
 
     def predict(self, X, **kwargs):
@@ -255,13 +262,19 @@ def predict_proba(self, X, **kwargs):
         n_train, p_train = self.scaled_X_train.shape
 
         if self.n_clusters_input > 0:
-            X = np.column_stack((X.copy(), cluster(
-                X, training=False, 
-                scaler=self.scaler_, 
-                label_encoder=self.label_encoder_, 
-                clusterer=self.clusterer_,
-                seed=self.seed
-            )))
+            X = np.column_stack(
+                (
+                    X.copy(),
+                    cluster(
+                        X,
+                        training=False,
+                        scaler=self.scaler_,
+                        label_encoder=self.label_encoder_,
+                        clusterer=self.clusterer_,
+                        seed=self.seed,
+                    ),
+                )
+            )
 
         n_test = X.shape[0]