Coverage for /pythoncovmergedfiles/medio/medio/usr/local/lib/python3.8/site-packages/scipy/spatial/

1"""

2This module provides functions to perform full Procrustes analysis.

4This code was originally written by Justin Kucynski and ported over from

5scikit-bio by Yoshiki Vazquez-Baeza.

6"""

8import numpy as np

9from scipy.linalg import orthogonal_procrustes

12__all__ = ['procrustes']

15def procrustes(data1, data2):

16 r"""Procrustes analysis, a similarity test for two data sets.

18 Each input matrix is a set of points or vectors (the rows of the matrix).

19 The dimension of the space is the number of columns of each matrix. Given

20 two identically sized matrices, procrustes standardizes both such that:

22 - :math:`tr(AA^{T}) = 1`.

24 - Both sets of points are centered around the origin.

26 Procrustes ([1]_, [2]_) then applies the optimal transform to the second

27 matrix (including scaling/dilation, rotations, and reflections) to minimize

28 :math:`M^{2}=\sum(data1-data2)^{2}`, or the sum of the squares of the

29 pointwise differences between the two input datasets.

31 This function was not designed to handle datasets with different numbers of

32 datapoints (rows). If two data sets have different dimensionality

33 (different number of columns), simply add columns of zeros to the smaller

34 of the two.

36 Parameters

37 ----------

38 data1 : array_like

39 Matrix, n rows represent points in k (columns) space `data1` is the

40 reference data, after it is standardised, the data from `data2` will be

41 transformed to fit the pattern in `data1` (must have >1 unique points).

42 data2 : array_like

43 n rows of data in k space to be fit to `data1`. Must be the same

44 shape ``(numrows, numcols)`` as data1 (must have >1 unique points).

46 Returns

47 -------

48 mtx1 : array_like

49 A standardized version of `data1`.

50 mtx2 : array_like

51 The orientation of `data2` that best fits `data1`. Centered, but not

52 necessarily :math:`tr(AA^{T}) = 1`.

53 disparity : float

54 :math:`M^{2}` as defined above.

56 Raises

57 ------

58 ValueError

59 If the input arrays are not two-dimensional.

60 If the shape of the input arrays is different.

61 If the input arrays have zero columns or zero rows.

63 See Also

64 --------

65 scipy.linalg.orthogonal_procrustes

66 scipy.spatial.distance.directed_hausdorff : Another similarity test

67 for two data sets

69 Notes

70 -----

71 - The disparity should not depend on the order of the input matrices, but

72 the output matrices will, as only the first output matrix is guaranteed

73 to be scaled such that :math:`tr(AA^{T}) = 1`.

75 - Duplicate data points are generally ok, duplicating a data point will

76 increase its effect on the procrustes fit.

78 - The disparity scales as the number of points per input matrix.

80 References

81 ----------

82 .. [1] Krzanowski, W. J. (2000). "Principles of Multivariate analysis".

83 .. [2] Gower, J. C. (1975). "Generalized procrustes analysis".

85 Examples

86 --------

87 >>> import numpy as np

88 >>> from scipy.spatial import procrustes

90 The matrix ``b`` is a rotated, shifted, scaled and mirrored version of

91 ``a`` here:

93 >>> a = np.array([[1, 3], [1, 2], [1, 1], [2, 1]], 'd')

94 >>> b = np.array([[4, -2], [4, -4], [4, -6], [2, -6]], 'd')

95 >>> mtx1, mtx2, disparity = procrustes(a, b)

96 >>> round(disparity)

97 0.0

99 """

100 mtx1 = np.array(data1, dtype=np.double, copy=True)

101 mtx2 = np.array(data2, dtype=np.double, copy=True)

102

103 if mtx1.ndim != 2 or mtx2.ndim != 2:

104 raise ValueError("Input matrices must be two-dimensional")

105 if mtx1.shape != mtx2.shape:

106 raise ValueError("Input matrices must be of same shape")

107 if mtx1.size == 0:

108 raise ValueError("Input matrices must be >0 rows and >0 cols")

109

110 # translate all the data to the origin

111 mtx1 -= np.mean(mtx1, 0)

112 mtx2 -= np.mean(mtx2, 0)

113

114 norm1 = np.linalg.norm(mtx1)

115 norm2 = np.linalg.norm(mtx2)

116

117 if norm1 == 0 or norm2 == 0:

118 raise ValueError("Input matrices must contain >1 unique points")

119

120 # change scaling of data (in rows) such that trace(mtx*mtx') = 1

121 mtx1 /= norm1

122 mtx2 /= norm2

123

124 # transform mtx2 to minimize disparity

125 R, s = orthogonal_procrustes(mtx1, mtx2)

126 mtx2 = np.dot(mtx2, R.T) * s

127

128 # measure the dissimilarity between the two datasets

129 disparity = np.sum(np.square(mtx1 - mtx2))

130

131 return mtx1, mtx2, disparity

132

Coverage for /pythoncovmergedfiles/medio/medio/usr/local/lib/python3.8/site-packages/scipy/spatial/_procrustes.py: 17%

24 statements