Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Speed up the creation of submatrices of Matrix_modn_dense_template matrices #36059

Merged
merged 24 commits into from
Aug 27, 2023
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Jump to
Jump to file
Failed to load files.
Diff view
Diff view
4 changes: 1 addition & 3 deletions src/sage/matrix/matrix1.pyx
Original file line number Diff line number Diff line change
Expand Up @@ -2176,9 +2176,7 @@ cdef class Matrix(Matrix0):
[5 4]

For example here we take from row 1 columns 2 then 0 twice, and do
this 3 times.

::
this 3 times::

sage: A.matrix_from_rows_and_columns([1,1,1],[2,0,0])
[5 3 3]
Expand Down
8 changes: 4 additions & 4 deletions src/sage/matrix/matrix_integer_dense.pyx
Original file line number Diff line number Diff line change
Expand Up @@ -1614,7 +1614,7 @@ cdef class Matrix_integer_dense(Matrix_dense):
return self._mod_two()
elif p < MAX_MODULUS_FLOAT:
res_f = Matrix_modn_dense_float.__new__(Matrix_modn_dense_float,
matrix_space.MatrixSpace(IntegerModRing(p), self._nrows, self._ncols, sparse=False), None, None, None)
matrix_space.MatrixSpace(IntegerModRing(p), self._nrows, self._ncols, sparse=False), None, None, None, zeroed_alloc=False)
for i from 0 <= i < self._nrows:
res_row_f = res_f._matrix[i]
for j from 0 <= j < self._ncols:
Expand All @@ -1623,7 +1623,7 @@ cdef class Matrix_integer_dense(Matrix_dense):

elif p < MAX_MODULUS_DOUBLE:
res_d = Matrix_modn_dense_double.__new__(Matrix_modn_dense_double,
matrix_space.MatrixSpace(IntegerModRing(p), self._nrows, self._ncols, sparse=False), None, None, None)
matrix_space.MatrixSpace(IntegerModRing(p), self._nrows, self._ncols, sparse=False), None, None, None, zeroed_alloc=False)
for i from 0 <= i < self._nrows:
res_row_d = res_d._matrix[i]
for j from 0 <= j < self._ncols:
Expand All @@ -1649,11 +1649,11 @@ cdef class Matrix_integer_dense(Matrix_dense):
if p < MAX_MODULUS_FLOAT:
res.append( Matrix_modn_dense_float.__new__(Matrix_modn_dense_float,
matrix_space.MatrixSpace(IntegerModRing(p), self._nrows, self._ncols, sparse=False),
None, None, None) )
None, None, None, zeroed_alloc=False) )
elif p < MAX_MODULUS_DOUBLE:
res.append( Matrix_modn_dense_double.__new__(Matrix_modn_dense_double,
matrix_space.MatrixSpace(IntegerModRing(p), self._nrows, self._ncols, sparse=False),
None, None, None) )
None, None, None, zeroed_alloc=False) )
else:
raise ValueError("p=%d too big."%p)

Expand Down
193 changes: 160 additions & 33 deletions src/sage/matrix/matrix_modn_dense_template.pxi
Original file line number Diff line number Diff line change
Expand Up @@ -90,7 +90,7 @@ We test corner cases for multiplication::
from libc.stdint cimport uint64_t
from cpython.bytes cimport *

from cysignals.memory cimport check_malloc, check_allocarray, sig_malloc, sig_free
from cysignals.memory cimport check_malloc, check_allocarray, check_calloc, sig_malloc, sig_free
from cysignals.signals cimport sig_check, sig_on, sig_off

from sage.libs.gmp.mpz cimport *
Expand Down Expand Up @@ -123,7 +123,7 @@ from sage.structure.proof.proof import get_flag as get_proof_flag
from sage.structure.richcmp cimport rich_to_bool
from sage.misc.randstate cimport randstate, current_randstate
import sage.matrix.matrix_space as matrix_space
from .args cimport MatrixArgs_init
from .args cimport SparseEntry, MatrixArgs_init


from sage.cpython.string cimport char_to_str
Expand Down Expand Up @@ -441,15 +441,18 @@ cpdef __matrix_from_rows_of_matrices(X):


cdef class Matrix_modn_dense_template(Matrix_dense):
def __cinit__(self):
def __cinit__(self, *args, bint zeroed_alloc=True, **kwds):
cdef long p = self._base_ring.characteristic()
self.p = p
if p >= MAX_MODULUS:
raise OverflowError("p (=%s) must be < %s."%(p, MAX_MODULUS))

self._entries = <celement *>check_allocarray(self._nrows * self._ncols, sizeof(celement))
if zeroed_alloc:
self._entries = <celement *>check_calloc(self._nrows * self._ncols, sizeof(celement))
else:
self._entries = <celement *>check_allocarray(self._nrows * self._ncols, sizeof(celement))

self._matrix = <celement **>check_allocarray(self._nrows, sizeof(celement*))

cdef unsigned int k
cdef Py_ssize_t i
k = 0
Expand Down Expand Up @@ -518,27 +521,28 @@ cdef class Matrix_modn_dense_template(Matrix_dense):
"""
ma = MatrixArgs_init(parent, entries)
cdef long i, j
it = ma.iter(False)
it = ma.iter(convert=False, sparse=True)
R = ma.base
p = R.characteristic()
for i in range(ma.nrows):
v = self._matrix[i]
for j in range(ma.ncols):
x = next(it)
if type(x) is int:
tmp = (<long>x) % p
v[j] = tmp + (tmp<0)*p
elif type(x) is IntegerMod_int and (<IntegerMod_int>x)._parent is R:
v[j] = <celement>(<IntegerMod_int>x).ivalue
elif type(x) is Integer:
if coerce:
v[j] = mpz_fdiv_ui((<Integer>x).value, p)
else:
v[j] = mpz_get_ui((<Integer>x).value)
elif coerce:
v[j] = R(x)

for t in it:
se = <SparseEntry>t
x = se.entry
v = self._matrix[se.i]
if type(x) is int:
tmp = (<long>x) % p
v[se.j] = tmp + (tmp<0)*p
elif type(x) is IntegerMod_int and (<IntegerMod_int>x)._parent is R:
v[se.j] = <celement>(<IntegerMod_int>x).ivalue
elif type(x) is Integer:
if coerce:
v[se.j] = mpz_fdiv_ui((<Integer>x).value, p)
else:
v[j] = <celement>x
v[se.j] = mpz_get_ui((<Integer>x).value)
elif coerce:
v[se.j] = R(x)
else:
v[se.j] = <celement>x

cdef long _hash_(self) except -1:
"""
Expand Down Expand Up @@ -786,7 +790,7 @@ cdef class Matrix_modn_dense_template(Matrix_dense):
cdef Matrix_modn_dense_template M
cdef celement p = self.p

M = self.__class__.__new__(self.__class__, self._parent,None,None,None)
M = self.__class__.__new__(self.__class__, self._parent,None,None,None, zeroed_alloc=False)

sig_on()
for i in range(self._nrows*self._ncols):
Expand Down Expand Up @@ -825,7 +829,7 @@ cdef class Matrix_modn_dense_template(Matrix_dense):
cdef celement p = self.p
cdef celement a = left

M = self.__class__.__new__(self.__class__, self._parent,None,None,None)
M = self.__class__.__new__(self.__class__, self._parent,None,None,None,zeroed_alloc=False)

sig_on()
for i in range(self._nrows*self._ncols):
Expand All @@ -844,7 +848,7 @@ cdef class Matrix_modn_dense_template(Matrix_dense):
False
"""
cdef Matrix_modn_dense_template A
A = self.__class__.__new__(self.__class__, self._parent, 0, 0, 0)
A = self.__class__.__new__(self.__class__,self._parent,None,None,None,zeroed_alloc=False)
memcpy(A._entries, self._entries, sizeof(celement)*self._nrows*self._ncols)
if self._subdivisions is not None:
A.subdivide(*self.subdivisions())
Expand Down Expand Up @@ -883,7 +887,7 @@ cdef class Matrix_modn_dense_template(Matrix_dense):
cdef celement k, p
cdef Matrix_modn_dense_template M

M = self.__class__.__new__(self.__class__, self._parent,None,None,None)
M = self.__class__.__new__(self.__class__, self._parent,None,None,None,zeroed_alloc=False)
p = self.p
cdef celement* other_ent = (<Matrix_modn_dense_template>right)._entries

Expand Down Expand Up @@ -920,7 +924,7 @@ cdef class Matrix_modn_dense_template(Matrix_dense):
cdef celement k, p
cdef Matrix_modn_dense_template M

M = self.__class__.__new__(self.__class__, self._parent, None, None, None)
M = self.__class__.__new__(self.__class__, self._parent, None, None, None, zeroed_alloc=False)
p = self.p
cdef celement* other_ent = (<Matrix_modn_dense_template>right)._entries

Expand Down Expand Up @@ -3012,14 +3016,21 @@ cdef class Matrix_modn_dense_template(Matrix_dense):
if nrows == -1:
nrows = self._nrows - row

if col != 0 or ncols != self._ncols:
return self.matrix_from_rows_and_columns(range(row, row+nrows), range(col, col+ncols))

if nrows < 0 or row < 0 or row + nrows > self._nrows:
raise IndexError("rows out of range")
if ncols < 0 or col < 0 or col + ncols > self._ncols:
raise IndexError("columns out of range")

cdef Matrix_modn_dense_template M = self.new_matrix(nrows=nrows, ncols=ncols)

if col == 0 and ncols == self._ncols:
memcpy(M._entries, self._matrix[row], sizeof(celement)*ncols*nrows)
return M

cdef Py_ssize_t i,r
for i,r in enumerate(range(row, row+nrows)) :
memcpy(M._matrix[i], self._matrix[r]+col, sizeof(celement)*ncols)

cdef Matrix_modn_dense_template M = self.new_matrix(nrows=nrows, ncols=self._ncols)
memcpy(M._entries, self._entries+row*ncols, sizeof(celement)*ncols*nrows)
Comment on lines -3021 to -3022
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

These two lines could be kept, under a condition if col == 0 and ncols == self._ncols. This would make the copying a bit faster (singly memcpy) in this situation where one wants to retrieve a (contiguous) block of complete rows.

return M

def _matrices_from_rows(self, Py_ssize_t nrows, Py_ssize_t ncols):
Expand Down Expand Up @@ -3065,6 +3076,122 @@ cdef class Matrix_modn_dense_template(Matrix_dense):
ans.append(M)
return ans

def matrix_from_columns(self, columns):
"""
Return the matrix constructed from self using columns with indices
in the columns list.

EXAMPLES::

sage: M = MatrixSpace(Integers(8),3,3)
sage: A = M(range(9)); A
[0 1 2]
[3 4 5]
[6 7 0]
sage: A.matrix_from_columns([2,1])
[2 1]
[5 4]
[0 7]
"""
cdef Py_ssize_t ncols = len(columns)

# Construct new matrix
cdef Matrix_modn_dense_template A = self.new_matrix(ncols=ncols)
cdef Py_ssize_t i, j, col
for j, col in enumerate(columns):
if col < 0 or col >= self._ncols:
raise IndexError("column index out of range")
for i in range(self._nrows):
A._matrix[i][j] = self._matrix[i][col]

return A

def matrix_from_rows(self, rows):
"""
Return the matrix constructed from self using rows with indices in
the rows list.

EXAMPLES::

sage: M = MatrixSpace(Integers(8),3,3)
sage: A = M(range(9)); A
[0 1 2]
[3 4 5]
[6 7 0]
sage: A.matrix_from_rows([2,1])
[6 7 0]
[3 4 5]
"""
cdef Py_ssize_t nrows = len(rows)

# Construct new matrix
cdef Matrix_modn_dense_template A = self.new_matrix(nrows=nrows)

cdef Py_ssize_t i, row
for i, row in enumerate(rows):
if row < 0 or row >= self._nrows:
raise IndexError("row index out of range")
memcpy(A._matrix[i], self._matrix[row], sizeof(celement)*self._ncols)

return A

def matrix_from_rows_and_columns(self, rows, columns):
"""
Return the matrix constructed from self from the given rows and
columns.

EXAMPLES::

sage: M = MatrixSpace(Integers(8),3,3)
sage: A = M(range(9)); A
[0 1 2]
[3 4 5]
[6 7 0]
sage: A.matrix_from_rows_and_columns([1], [0,2])
[3 5]
sage: A.matrix_from_rows_and_columns([1,2], [1,2])
[4 5]
[7 0]

Note that row and column indices can be reordered or repeated::

sage: A.matrix_from_rows_and_columns([2,1], [2,1])
[0 7]
[5 4]

For example here we take from row 1 columns 2 then 0 twice, and do
this 3 times::

sage: A.matrix_from_rows_and_columns([1,1,1],[2,0,0])
[5 3 3]
[5 3 3]
[5 3 3]

AUTHORS:

- Jaap Spies (2006-02-18)

- Didier Deshommes: some Pyrex speedups implemented
"""
cdef Py_ssize_t ncols = len(columns)
cdef Py_ssize_t nrows = len(rows)

# Check whether column indices are valid
cdef Py_ssize_t i, j, row, col
for col in columns:
if col < 0 or col >= self._ncols:
raise IndexError("column index out of range")

# Construct new matrix
cdef Matrix_modn_dense_template A = self.new_matrix(nrows=nrows, ncols=ncols)
for i, row in enumerate(rows):
if row < 0 or row >= self._nrows:
raise IndexError("row index out of range")
for j, col in enumerate(columns):
A._matrix[i][j] = self._matrix[row][col]

return A

def __bool__(self):
"""
Test whether this matrix is zero.
Expand Down