Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add spenc as a lib rather than using via an import #93

Merged
merged 2 commits into from
Jan 11, 2021
Merged
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 0 additions & 1 deletion environment.yml
Original file line number Diff line number Diff line change
@@ -11,7 +11,6 @@ dependencies:
- geopandas>=0.7.0
- matplotlib
- scikit-learn=0.22
- spenc
- pytest
- pytest-cov
- pulp
85 changes: 43 additions & 42 deletions spopt/region/spenc.py
Original file line number Diff line number Diff line change
@@ -1,46 +1,47 @@
from ..BaseClass import BaseSpOptHeuristicSolver
import numpy as np
from warnings import warn
from spenc import SPENC
from .spenclib import SPENC


class Spenc(BaseSpOptHeuristicSolver):
    """
    Spatially encouraged spectral clustering.

    :cite:`wolf2018`

    Thin wrapper that stores the problem inputs and, on ``solve()``, fits a
    ``SPENC`` model and exposes its labels as ``labels_``.
    """

    def __init__(self, gdf, w, attrs_name, n_clusters=5, random_state=None,
                 gamma=1):
        """
        Parameters
        ----------
        gdf : geopandas.GeoDataFrame
            Table holding the attribute columns to cluster on.
        w : libpysal.weights.W instance
            Spatial weights matrix; its ``sparse`` attribute is what gets
            handed to the model in ``solve()``.
        attrs_name : list
            Strings for attribute names (cols of ``geopandas.GeoDataFrame``).
        n_clusters : int, optional, default: 5
            The number of clusters to form.
        random_state : optional, default: None
            Forwarded unchanged to ``SPENC`` as ``random_state``.
        gamma : int, default: 1
            Forwarded unchanged to ``SPENC`` as ``gamma``.
        """
        self.gdf = gdf
        self.w = w
        self.attrs_name = attrs_name
        self.n_clusters = n_clusters
        self.gamma = gamma
        self.random_state = random_state

    def solve(self):
        """Fit the SPENC model and store the result in ``self.labels_``."""
        data = self.gdf
        # Plain array of the selected attribute columns, one row per record.
        X = data[self.attrs_name].values
        model = SPENC(n_clusters=self.n_clusters,
                      random_state=self.random_state,
                      gamma=self.gamma)
        model.fit(X, self.w.sparse)
        self.labels_ = model.labels_
1 change: 1 addition & 0 deletions spopt/region/spenclib/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
from .abstracts import SPENC
604 changes: 604 additions & 0 deletions spopt/region/spenclib/abstracts.py

Large diffs are not rendered by default.

21 changes: 21 additions & 0 deletions spopt/region/spenclib/scores.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,21 @@
import numpy as np

def boundary_fraction(W, labels, X = None):
    """
    Fraction of observations that have at least one neighbor with a
    different label.

    Parameters
    ----------
    W : matrix with one row per observation
        Adjacency/affinity matrix. It is iterated row by row and the nonzero
        column positions of each row are taken as that row's neighbors.
    labels : array-like
        One label per row of ``W``. Coerced with ``np.asarray`` so that plain
        sequences can be used as well as arrays.
    X : optional
        Unused; accepted only so the signature matches other scorers.

    Returns
    -------
    float
        Number of rows with a differently-labelled neighbor divided by
        ``W.shape[0]``. Rows with no neighbors never count as boundary rows.
    """
    # Positional fancy-indexing below needs an ndarray, not a list.
    labels = np.asarray(labels)
    boundary = 0
    for row, own_label in zip(W, labels):
        # nonzero() returns a tuple of index arrays; the last entry holds the
        # column indices whether `row` is 1-D or a 1xN sparse row.
        neighbor_labels = labels[row.nonzero()[-1]]
        boundary += (neighbor_labels != own_label).any().astype(int)
    return boundary / W.shape[0]

def boundary_score(W, labels, X = None):
    """
    Returns a version of boundary_fraction unbounded on the negative end using
    the log of the fraction:
    np.log(boundary_fraction(W, labels))
    This is solely for testing purposes.

    Parameters
    ----------
    W, labels, X
        Passed straight through to ``boundary_fraction``.

    Returns
    -------
    The natural log (``np.log``) of the boundary fraction.
    """
    # Forward the caller's X rather than discarding it with a literal None.
    return np.log(boundary_fraction(W, labels, X=X))
32 changes: 32 additions & 0 deletions spopt/region/spenclib/utils.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,32 @@
import scipy.sparse.csgraph as csg
import scipy.sparse as sp
from warnings import warn as Warn
import numpy as np

def check_weights(W, X=None, transform = None):
    """
    Sanity-check a spatial affinity matrix and warn if it is disconnected.

    Parameters
    ----------
    W : matrix-like
        Affinity matrix; anything ``scipy.sparse.csc_matrix`` accepts.
    X : optional
        If given, must have the same number of rows as ``W``
        (compared via ``shape[0]``).
    transform : optional
        Unused by this function; kept for interface compatibility.

    Returns
    -------
    W, unchanged (the same object that was passed in).

    Raises
    ------
    AssertionError
        If ``X`` is given and its row count differs from that of ``W``.
    """
    if X is not None:
        assert W.shape[0] == X.shape[0], "W does not have the same number of samples as X"
    # Work on a sparse copy so explicit zeros can be dropped without
    # touching the caller's matrix.
    graph = sp.csc_matrix(W)
    graph.eliminate_zeros()
    n_components, _ = csg.connected_components(graph)
    if n_components > 1:
        message = ('Spatial affinity matrix is disconnected, and has {} subcomponents. '
                   'This will certainly affect the solution output.')
        # The placeholder is now actually filled with the component count.
        Warn(message.format(n_components))
    return W

def lattice(x, y):
    """
    Build a grid of unit-square polygons, ``x`` cells by ``y`` cells.

    Each cell has its lower-left corner at ``(i, j)`` for ``i`` in
    ``np.arange(x)`` and ``j`` in ``np.arange(y)`` (as floats), with ``i``
    varying slowest. The polygons are returned as the ``'geometry'`` column
    of a ``geopandas.GeoDataFrame``.
    """
    # Imported lazily so the module loads without shapely/geopandas.
    from shapely.geometry import Polygon
    import geopandas as gpd

    x_origins = np.arange(x) * 1.0
    y_origins = np.arange(y) * 1.0
    # Corner order per cell: lower-left, lower-right, upper-right, upper-left.
    cells = [
        Polygon([(i, j), (i + 1, j), (i + 1, j + 1), (i, j + 1)])
        for i in x_origins
        for j in y_origins
    ]
    return gpd.GeoDataFrame({'geometry': cells})