Numeric

Functions

calc_communities(starts, ends, edge_weights, louvain_resolution=1.0, out_dir=None, transform_to_epsg_4978=None)

Build a networkx graph from adjacency information. Each node represents a detection while the edges represent the quality of the matches between detections.

Parameters:

starts (ndarray, required): (N, 3) array of ray start points
ends (ndarray, required): (N, 3) array of ray end points
edge_weights (List[Tuple[int, int, Dict[str, float]]], required): List of edges defining the graph connectivity. Each edge is (start_idx, end_idx, weight_dict) where weight_dict contains the edge weight information
louvain_resolution (float, default 1.0): Resolution hyperparameter for the Louvain community detection algorithm. Higher values lead to more communities
out_dir (PATH_TYPE, default None): Directory to save the output NPZ file containing community information. If None, results are returned as a dictionary
transform_to_epsg_4978 (ndarray, default None): 4x4 transformation matrix to convert points from local coordinates to EPSG:4978 (Earth-centered, Earth-fixed)

Returns:

Union[Path, Dict[str, ndarray]]: If out_dir is provided, returns the path to the NPZ file containing the community information. Otherwise returns a dictionary with keys:
- 'ray_IDs': (N,) array mapping each ray to its community ID
- 'community_points': (M, 3) array of 3D points representing each community
- 'community_points_latlon': (M, 3) array of lat/lon points (only if transform_to_epsg_4978 is provided)

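A minimal usage sketch with made-up ray geometry and edge weights; in practice the edge weights would typically come from calc_graph_weights:

import numpy as np

from geograypher.utils.numeric import calc_communities

# Four rays: 0/1 converge near (0.5, 1, 0) and 2/3 converge near (5.5, 1, 0)
starts = np.array(
    [[0.0, 0.0, 0.0], [1.0, 0.0, 0.0], [5.0, 0.0, 0.0], [6.0, 0.0, 0.0]]
)
ends = np.array(
    [[0.5, 1.0, 0.0], [0.5, 1.0, 0.1], [5.5, 1.0, 0.0], [5.5, 1.0, 0.1]]
)
# Strong edges within each pair, so Louvain should find two communities
edge_weights = [(0, 1, {"weight": 10.0}), (2, 3, {"weight": 10.0})]

result = calc_communities(starts, ends, edge_weights)
print(result["ray_IDs"])           # community ID per ray, e.g. [0. 0. 1. 1.]
print(result["community_points"])  # one representative 3D point per community
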
Source code in geograypher/utils/numeric.py
def calc_communities(
    starts: np.ndarray,
    ends: np.ndarray,
    edge_weights: typing.List[typing.Tuple[int, int, typing.Dict[str, float]]],
    louvain_resolution: float = 1.0,
    out_dir: typing.Optional[PATH_TYPE] = None,
    transform_to_epsg_4978: typing.Optional[np.ndarray] = None,
) -> typing.Union[Path, typing.Dict[str, np.ndarray]]:
    """
    Build a networkx graph from adjacency information. Each node represents
    a detection while the edges represent the quality of the matches between detections.

    Args:
        starts (np.ndarray): (N, 3) array of ray start points
        ends (np.ndarray): (N, 3) array of ray end points
        edge_weights (List[Tuple[int, int, Dict[str, float]]]): List of edges defining
            the graph connectivity. Each edge is (start_idx, end_idx, weight_dict) where
            weight_dict contains the edge weight information
        louvain_resolution (float): Resolution hyperparameter for the Louvain community
            detection algorithm. Higher values lead to more communities
        out_dir (PATH_TYPE, optional): Directory to save the output NPZ file containing
            community information. If None, results are returned as a dictionary
        transform_to_epsg_4978 (np.ndarray, optional): 4x4 transformation matrix to
            convert points from local coordinates to EPSG:4978 (Earth-centered Earth-fixed)

    Returns:
        Union[Path, Dict[str, np.ndarray]]: If out_dir is provided, returns the path to
            the NPZ file containing the community information. Otherwise returns a
            dictionary with keys:
            - 'ray_IDs': (N,) array mapping each ray to its community ID
            - 'community_points': (M, 3) array of 3D points representing each community
            - 'community_points_latlon': (M, 3) array of lat/lon points (only if
               transform_to_epsg_4978 is provided)
    """

    # Build up the basic graph from edge weights
    graph = networkx.Graph(edge_weights)

    # Check that the graph is non-empty
    if len(graph) > 0:

        # Determine Louvain communities which are sets of nodes. Ideally, each
        # community represents a set of detections that correspond to one 3D object
        communities = networkx.community.louvain_communities(
            graph, weight="weight", resolution=louvain_resolution
        )
        # Sort the communities by size
        communities = sorted(communities, key=len, reverse=True)

        # Triangulate the rays for each community to identify the 3D location
        community_points = []
        # Record the community IDs per ray
        num_rays = starts.shape[0]
        ray_IDs = np.full(num_rays, fill_value=np.nan)
        # Iterate over communities
        for community_ID, community in enumerate(
            tqdm(communities, desc="Build community points")
        ):
            # Get the ray indices that belong to that community
            community_indices = np.array(list(community))
            # Record the community ID for the corresponding rays
            ray_IDs[community_indices] = community_ID
            # Use the average of the closest points between rays as the
            # representative point for the community
            community_points.append(
                intersection_average(
                    starts=starts[community_indices],
                    ends=ends[community_indices],
                )
            )

        # Stack all of the community points into one (M, 3) array
        community_points = np.vstack(community_points)

        result = {
            "ray_IDs": ray_IDs,
            "community_points": community_points,
        }

        if transform_to_epsg_4978 is not None:
            # Append a column of all ones to make the homogeneous coordinates
            homogenous = np.concatenate(
                [community_points, np.ones_like(community_points[:, 0:1])],
                axis=1,
            )
            # Use the transform matrix to transform the points into the earth
            # centered, earth fixed frame (EPSG:4978)
            community_points_epsg_4978 = (transform_to_epsg_4978 @ homogenous.T).T
            # Convert the points from earth centered, earth fixed frame to lat lon
            community_points_lat_lon = convert_CRS_3D_points(
                community_points_epsg_4978,
                input_CRS=EARTH_CENTERED_EARTH_FIXED_CRS,
                output_CRS=LAT_LON_CRS,
            )
            result["community_points_latlon"] = community_points_lat_lon

    else:
        # Handle the empty case
        result = {
            "ray_IDs": np.zeros((0,), dtype=int),
            "community_points": np.zeros((0, 3)),
        }
        if transform_to_epsg_4978 is not None:
            result["community_points_latlon"] = np.zeros((0, 3))

    if out_dir is not None:
        path = Path(out_dir) / "communities.npz"
        np.savez(path, **result)
        return path
    else:
        return result

calc_graph_weights(starts, ends, ray_IDs, similarity_threshold, out_dir=None, min_dist=1e-06, step=5000, transform=None)

This function processes sets of ray segments to build a graph where edges represent ray intersections. The weight of each edge is inversely proportional to the intersection distance between rays. For memory efficiency with large numbers of segments, the computation is done in chunks.

Parameters:

starts (ndarray, required): (N, 3) array of ray start points
ends (ndarray, required): (N, 3) array of ray end points
ray_IDs (ndarray, required): (N,) array of integers identifying which image each ray comes from
similarity_threshold (float, required): Maximum intersection distance to consider when creating graph edges. Greater distances will be dropped
out_dir (PATH_TYPE, default None): Directory to save the output JSON file containing edge information. If None, no file is saved and a list of edge weights is returned instead
min_dist (float, default 1e-06): Minimum intersection distance to allow, used to avoid division by zero when calculating weights
step (int, default 5000): Number of rays to process in each chunk to manage memory usage
transform (callable, default None): Function to apply to distances before inversion for weight calculation. For example, if you want graph weights to be distance^3, use lambda x: x**3

Returns:

Union[Path, List[Tuple]]: If out_dir is provided, returns the path to the JSON file containing the edge information. Otherwise returns a list of tuples, each containing (start_idx, end_idx, weight_dict) where weight_dict contains the edge weight information

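A minimal sketch of the typical pipeline, using two made-up rays; the returned list feeds directly into calc_communities:

import numpy as np

from geograypher.utils.numeric import calc_graph_weights

# Two rays from different images that pass within about 0.05 of each other
starts = np.array([[0.0, 0.0, 0.0], [1.0, 0.0, 0.0]])
ends = np.array([[0.5, 1.0, 0.0], [0.5, 1.0, 0.05]])
ray_IDs = np.array([0, 1])  # the image each ray comes from

edge_weights = calc_graph_weights(
    starts,
    ends,
    ray_IDs,
    similarity_threshold=0.5,  # drop intersections farther apart than this
    transform=lambda d: d**2,  # optional: makes weight = 1 / distance^2
)
print(edge_weights)  # e.g. [(0, 1, {"weight": ...})]
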
Source code in geograypher/utils/numeric.py
def calc_graph_weights(
    starts: np.ndarray,
    ends: np.ndarray,
    ray_IDs: np.ndarray,
    similarity_threshold: float,
    out_dir: typing.Optional[PATH_TYPE] = None,
    min_dist: float = 1e-6,
    step: int = 5000,
    transform: typing.Optional[typing.Callable[[np.ndarray], np.ndarray]] = None,
) -> typing.Union[Path, typing.List[typing.Tuple]]:
    """
    This function processes sets of ray segments to build a graph where edges represent
    ray intersections. The weight of each edge is inversely proportional to the
    intersection distance between rays. For memory efficiency with large numbers of
    segments, the computation is done in chunks.

    Args:
        starts (np.ndarray): (N, 3) array of ray start points
        ends (np.ndarray): (N, 3) array of ray end points
        ray_IDs (np.ndarray): (N,) array of integers identifying which image
            each ray comes from
        similarity_threshold (float): Maximum intersection distance to consider when
            creating graph edges. Greater distances will be dropped.
        out_dir (PATH_TYPE, optional): Directory to save the output JSON file containing
            edge information. If None, no file is saved and a list of edge weights
            is returned instead.
        min_dist (float, optional): Minimum intersection distance to allow, used to
            avoid division by zero when calculating weights. Defaults to 1e-6
        step (int, optional): Number of rays to process in each chunk to manage memory
            usage. Defaults to 5000
        transform (callable, optional): Function to apply to distances before inversion
            for weight calculation. For example, if you want graph weights to be
            distance^3, use lambda x: x**3. Defaults to None

    Returns:
        Union[Path, List[Tuple]]: If out_dir is provided, returns the path to the JSON
        file containing the edge information. Otherwise returns a list of tuples, each
        containing (start_idx, end_idx, weight_dict) where weight_dict contains the
        edge weight information
    """

    # Calculate and filter intersection distances
    # For memory reasons, we need to iterate over blocks. When the number of segments starts
    # getting very large, the matrices for calculating ray intersections take a great
    # deal of RAM
    edge_weights = []
    num_steps = np.ceil(len(starts) / step)
    total = int(num_steps * (num_steps + 1) / 2)
    for islice, jslice, diagonal in tqdm(
        chunk_slices(N=len(starts), step=step),
        total=total,
        desc="Calculating graph weights",
    ):
        _, _, dist = compute_approximate_ray_intersections(
            a0=starts[islice],
            a1=ends[islice],
            b0=starts[jslice],
            b1=ends[jslice],
            clamp=True,
        )
        if diagonal:
            np.fill_diagonal(dist, np.nan)
        dist[dist > similarity_threshold] = np.nan
        dist[dist < min_dist] = min_dist

        # Apply transform if provided
        if transform is not None:
            dist = transform(dist)

        # Create edge weights for valid intersections
        edge_weights.extend(format_graph_edges(islice, jslice, dist, ray_IDs))

    if out_dir is None:
        return edge_weights
    else:
        path = Path(out_dir) / "edge_weights.json"
        with path.open("w") as file:
            json.dump(edge_weights, file)
        return path

chunk_slices(N, step)

Yield slices for (step, step) chunks of the upper triangular area of an (N, N) square matrix.

For example, if N=5 and step=2, the slices would grab:

    1 1 2 2 3
    1 1 2 2 3
    - - 4 4 5
    - - 4 4 5
    - - - - 6

And in the (1, 4, 6) cases, is_diag would be True.

Yields:

Tuple[slice, slice, bool]: Each yielded value is (islice, jslice, is_diag), where:
- islice: slice along the first axis
- jslice: slice along the second axis
- is_diag: True if the chunk is on the diagonal (i == j)
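
A quick check of the diagram above, assuming the module is importable as geograypher.utils.numeric:

from geograypher.utils.numeric import chunk_slices

# Enumerate the upper-triangular 2x2 chunks of a 5x5 matrix
for islice, jslice, is_diag in chunk_slices(N=5, step=2):
    print(islice, jslice, is_diag)
# slice(0, 2) slice(0, 2) True
# slice(0, 2) slice(2, 4) False
# slice(0, 2) slice(4, 5) False
# slice(2, 4) slice(2, 4) True
# slice(2, 4) slice(4, 5) False
# slice(4, 5) slice(4, 5) True
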
Source code in geograypher/utils/numeric.py
def chunk_slices(
    N: int, step: int
) -> typing.Iterator[typing.Tuple[slice, slice, bool]]:
    """
    Yield slices for (step, step) chunks of the upper triangular area
    of an (N, N) square matrix.

    For example, if N=5 and step=2, the slices would grab:
        1 1 2 2 3
        1 1 2 2 3
        - - 4 4 5
        - - 4 4 5
        - - - - 6
    And in the (1, 4, 6) cases, is_diag would be True

    Yields:
        Each yielded value is (islice, jslice, is_diag), where:
        - islice: slice along the first axis
        - jslice: slice along the second axis
        - is_diag: True if the chunk is on the diagonal (i == j)
    """
    ranges = range(0, N, step)
    for i, j in product(ranges, repeat=2):
        if j >= i:  # upper triangle including diagonal
            islice = slice(i, min(i + step, N))
            jslice = slice(j, min(j + step, N))
            yield islice, jslice, i == j

compute_3D_triangle_area_vectorized(corners, return_z_proj_area=True)

Compute the area of 3D triangles in a vectorized fashion, optionally also returning the area of each triangle projected onto the z=0 plane.

Parameters:

corners (ndarray, required): Triangle corners, unpacked as A, B, C = corners, with the next axis holding the (x, y, z) coordinates and a trailing axis indexing the faces
return_z_proj_area (bool, default True): If True, also return the area of each triangle projected onto the z=0 plane

Returns:

np.ndarray: The per-triangle 3D areas, or a tuple (area, area_z_proj) if return_z_proj_area is True

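A usage sketch; note that the (corner, coordinate, face) layout used here is inferred from the A, B, C = corners unpacking and the u[0]/u[1]/u[2] coordinate indexing in the source below, not from the original docstring:

import numpy as np

from geograypher.utils.numeric import compute_3D_triangle_area_vectorized

# Two triangles stacked along the last axis: a unit right triangle in the
# z=0 plane, and the same triangle with corner C lifted to z=1
corners = np.array(
    [
        [[0.0, 0.0], [0.0, 0.0], [0.0, 0.0]],  # corner A: (x, y, z) per face
        [[1.0, 1.0], [0.0, 0.0], [0.0, 0.0]],  # corner B
        [[0.0, 0.0], [1.0, 1.0], [0.0, 1.0]],  # corner C
    ]
)
area, area_z_proj = compute_3D_triangle_area_vectorized(corners)
print(area)         # [0.5, ~0.707]: true 3D areas
print(area_z_proj)  # [0.5, 0.5]: areas projected onto the z=0 plane
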
Source code in geograypher/utils/numeric.py
def compute_3D_triangle_area_vectorized(corners: np.ndarray, return_z_proj_area=True):
    """_summary_

    Args:
        corners (np.ndarray): (n_faces, n)
        return_z_proj_area (bool, optional): _description_. Defaults to True.

    Returns:
        _type_: _description_
    """
    A, B, C = corners
    # https://math.stackexchange.com/questions/2152754/calculate-3d-triangle-area-by-determinant
    u = B - A
    v = C - A

    # Save for future computation
    u0v1_min_u1v0 = u[0] * v[1] - u[1] * v[0]
    area = (
        1
        / 2
        * np.sqrt(
            np.power(u[1] * v[2] - u[2] * v[1], 2)
            + np.power(u[2] * v[0] - u[0] * v[2], 2)
            + np.power(u0v1_min_u1v0, 2)
        )
    )

    if return_z_proj_area:
        area_z_proj = np.abs(u0v1_min_u1v0) / 2
        return area, area_z_proj

    return area

compute_approximate_ray_intersections(a0, a1, b0, b1, clamp=False)

Compute closest points and distances between N line segments a0->a1 and b0->b1. Returns (N, N, 3), (N, N, 3), (N, N). If clamp is True, then respect the line segment ends. If clamp is False, then use the infinite rays.

Based on https://stackoverflow.com/questions/2824478/shortest-distance-between-two-line-segments

Parameters:

a0 (ndarray, required): Start points of the first segments (N, 3)
a1 (ndarray, required): End points of the first segments (N, 3)
b0 (ndarray, required): Start points of the second segments (N, 3)
b1 (ndarray, required): End points of the second segments (N, 3)
clamp (bool, default False): If True, the closest points are clamped to the segment endpoints. If False, the closest points may be anywhere along the infinite rays

Returns:

pA (ndarray): Closest point on the A segments (axis 0) compared to each of the B segments (axis 1), shape (N, N, 3). For example, the closest point between A[5] and B[2] is at pA[5, 2]
pB (ndarray): Closest point on the B segments (axis 1) compared to each of the A segments (axis 0), shape (N, N, 3)
dist (ndarray): The minimum distance between the A (axis 0) and B (axis 1) segments, shape (N, N)

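A small sketch comparing two segments against each other; the same arrays are passed as both the A and B sets, mirroring how intersection_average calls this function:

import numpy as np

from geograypher.utils.numeric import compute_approximate_ray_intersections

# Segment 0 runs along x; segment 1 runs along y, offset by 1 unit in z
a0 = np.array([[-1.0, 0.0, 0.0], [0.0, -1.0, 1.0]])
a1 = np.array([[1.0, 0.0, 0.0], [0.0, 1.0, 1.0]])

pA, pB, dist = compute_approximate_ray_intersections(a0, a1, a0, a1, clamp=True)
print(dist[0, 1])  # 1.0: closest approach between segments 0 and 1
print(pA[0, 1])    # [0. 0. 0.]: the point on segment 0 closest to segment 1
print(pB[0, 1])    # [0. 0. 1.]: the point on segment 1 closest to segment 0
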
Source code in geograypher/utils/numeric.py
def compute_approximate_ray_intersections(
    a0: np.ndarray, a1: np.ndarray, b0: np.ndarray, b1: np.ndarray, clamp: bool = False
) -> typing.Tuple[np.ndarray, np.ndarray, np.ndarray]:
    """
    Compute closest points and distances between N line segments a0->a1 and
    b0->b1. Returns (N, N, 3), (N, N, 3), (N, N). If clamp is True, then respect
    the line segment ends. If clamp is False, then use the infinite rays.

    Based on https://stackoverflow.com/questions/2824478/shortest-distance-between-two-line-segments

    Args:
        a0 (np.ndarray): Start points of the first segments (N, 3).
        a1 (np.ndarray): End points of the first segments (N, 3).
        b0 (np.ndarray): Start points of the second segments (N, 3).
        b1 (np.ndarray): End points of the second segments (N, 3).
        clamp (bool, optional): If True, the closest points are clamped to the
            segment endpoints. If False, the closest points may be anywhere
            along the infinite rays.

    Returns:
        pA (np.ndarray): Closest point on the A segments (axis 0) compared to
            each of the B segments (axis 1) (N, N, 3). For example, the closest
            point between A[5] and B[2] is at pA[5, 2]
        pB (np.ndarray): Closest point on the B segments (axis 1) compared to
            each of the A segments (axis 0) (N, N, 3)
        dist (np.ndarray): The minimum distance between the A (axis 0) and B
            (axis 1) segments.
    """

    # (N, 3) vectors, representing the A and B line segments
    A = a1 - a0
    B = b1 - b0
    # (N,) distances, representing the length of each A and B vector
    magA = np.linalg.norm(A, axis=1)
    magB = np.linalg.norm(B, axis=1)
    # (N, 3) vectors, representing the A and B unit vectors
    _A = A / magA[:, None]
    _B = B / magB[:, None]

    # Expand the A vectors to (N, 1, 3) and the B vectors to (1, N, 3) so that
    # they project together to an (N, N, 3) matrix later
    a0_exp = a0[:, None, :]
    b0_exp = b0[None, :, :]
    _A_exp = _A[:, None, :]
    _B_exp = _B[None, :, :]

    # (N, N, 3) cross product. The cross product of unit vectors calculates the
    # area of the parallelogram formed by the unit vectors, a larger value
    # indicates lines that are more orthogonal
    cross = np.cross(_A_exp, _B_exp)
    # (N, N) representing the squared area of the unit vector parallelograms
    denom = np.linalg.norm(cross, axis=2) ** 2

    # (N, N, 3) matrix, representing the vector from the start of each A
    # segment to the start of each B segment
    t = b0_exp - a0_exp

    # (N, N) matrix, calculate the determinant by multiplying all axes (ijk)
    # and then sum across k, leaving only an ij matrix. The determinant
    # represents how a given transform scales space
    detA = np.einsum("ijk,ijk->ij", np.cross(t, _B_exp), cross)
    detB = np.einsum("ijk,ijk->ij", np.cross(t, _A_exp), cross)

    # Make the denom safe for division by replacing 0 values with 1. Later we
    # check for parallel locations and fix them
    parallel = denom == 0
    denom[parallel] = 1

    # t0 and t1 are (N, N) matrices representing how far along A the closest
    # point is (t0), measured as a distance from a0 (so a value of magA lands
    # on a1). The same holds for B and t1.
    t0 = detA / denom
    t1 = detB / denom

    if clamp:
        # (N, N) matrix where t0 and t1 are clipped to the vector length
        t0_clamped = np.clip(t0, 0, magA[:, None])
        t1_clamped = np.clip(t1, 0, magB[None, :])

        # (N, N, 3) matrix where we start at each vector starting point (a0
        # and b0 expanded) then travel along them to the closest clamped point
        pA = a0_exp + t0_clamped[:, :, None] * _A_exp
        pB = b0_exp + t1_clamped[:, :, None] * _B_exp

        # Check whether the original scale values were out of bounds
        oob_A = (t0 < 0) | (t0 > magA[:, None])
        oob_B = (t1 < 0) | (t1 > magB[None, :])

        # Broadcast a0 and _A to (N, N, 3), similar for b0/_B
        a0_bcast = np.broadcast_to(a0[:, None, :], pA.shape)
        _A_bcast = np.broadcast_to(_A[:, None, :], pA.shape)
        b0_bcast = np.broadcast_to(b0[None, :, :], pB.shape)
        _B_bcast = np.broadcast_to(_B[None, :, :], pB.shape)

        # If any of the scale vectors were clipped, we may have to adjust the
        # closest point on the opposite vector. For example if the closest
        # point on an A vector was clipped, the corresponding B point may need
        # to update
        if np.any(oob_A):
            # Get the projection of the new A point onto the B vectors
            dot = np.einsum("ijk,ijk->ij", pA - b0_bcast, _B_bcast)
            # Get a new B point matching that projection
            dot_clipped = np.clip(dot, 0, magB[None, :])
            pB[oob_A] = b0_bcast[oob_A] + dot_clipped[oob_A, None] * _B_bcast[oob_A]
        if np.any(oob_B):
            # Get the projection of the new B point onto the A vectors
            dot = np.einsum("ijk,ijk->ij", pB - a0_bcast, _A_bcast)
            # Get a new A point matching that projection
            dot_clipped = np.clip(dot, 0, magA[:, None])
            pA[oob_B] = a0_bcast[oob_B] + dot_clipped[oob_B, None] * _A_bcast[oob_B]
    else:
        # If there is no clamping, we use the scale value as-is to get the
        # closest points between the rays
        pA = a0_exp + t0[:, :, None] * _A_exp
        pB = b0_exp + t1[:, :, None] * _B_exp

    # Handle parallel case
    if np.any(parallel):
        # Get the (N, N) projection of each point in b0 onto each unit vector
        # in A. Subtract the (N, 1) projection of each point in a0 along their
        # unit vector. By subtracting them, we calculating whether b0 falls
        # "ahead" or "behind" of a0, along the relevant axis (_A)
        d0 = np.einsum("ij,kj->ik", _A, b0) - np.einsum("ij,ij->i", _A, a0).reshape(
            -1, 1
        )
        if clamp:
            # Same logic as d0, but with a1 and b1
            d1 = np.einsum("ij,kj->ik", _A, b1) - np.einsum("ij,ij->i", _A, a0).reshape(
                -1, 1
            )

            # Check in which of the (N, N) combinations b0 and b1 fall before
            # a0, forming an (N, N) boolean mask
            before = (d0 <= 0) & (d1 <= 0) & parallel
            # Same logic for after
            after = (d0 >= magA[:, None]) & (d1 >= magA[:, None]) & parallel
            # Where an A and B vector are parallel and partially overlapping,
            # the (N, N) boolean mask middle will be True
            middle = parallel & ~(before | after)

            if np.any(before):
                # Set pA to a0 where relevant
                pA[before] = a0[:, None, :][before]
                # Set pB to whichever endpoint is closer to a0
                pB[before] = np.where(
                    np.abs(d0[before])[:, None] < np.abs(d1[before])[:, None],
                    b0[None, :, :][before],
                    b1[None, :, :][before],
                )

            if np.any(after):
                # Set pA to a1 where relevant
                pA[after] = a1[:, None, :][after]
                # Set pB to whichever endpoint is closer to a1
                pB[after] = np.where(
                    np.abs(d0[after])[:, None] < np.abs(d1[after])[:, None],
                    b0[None, :, :][after],
                    b1[None, :, :][after],
                )

            if np.any(middle):
                # Clip d0 along the A vectors (from 0 to the magnitude of A)
                t_mid = np.clip(
                    d0[middle], 0, np.broadcast_to(magA[:, None], d0.shape)[middle]
                )

                # Get the broadcast components that align with the state we
                # care about (middle)
                a0_bcast = np.broadcast_to(a0[:, None, :], pA.shape)
                _A_bcast = np.broadcast_to(_A[:, None, :], pA.shape)
                a0_mid = a0_bcast[middle]
                _A_mid = _A_bcast[middle]

                # Reproject onto the A vectors
                pA[middle] = a0_mid + t_mid[:, None] * _A_mid

                # Get the vector from the new pA points to b0
                b0_bcast = np.broadcast_to(b0[None, :, :], pB.shape)
                a2b = b0_bcast[middle] - pA[middle]

                # Then subtract the component that is along the A vectors, and
                # that gives us the final pB location
                alongA = np.einsum("ij,ij->i", a2b, _A_mid)[:, None] * _A_mid
                pB[middle] = pA[middle] + (a2b - alongA)

        else:
            # If we're not clamping, arbitrarily set the parallel "closest
            # points" to b0 and the matching point on A
            a0_bcast = np.broadcast_to(a0[:, None, :], pA.shape)
            b0_bcast = np.broadcast_to(b0[None, :, :], pB.shape)
            _A_bcast = np.broadcast_to(_A[:, None, :], pA.shape)
            pA[parallel] = (
                a0_bcast[parallel] + d0[:, :, None][parallel] * _A_bcast[parallel]
            )
            pB[parallel] = b0_bcast[parallel]

    # pA and pB are existing (N, N, 3) matrices. In addition, calculate the
    # (N, N) distances between each pair
    return pA, pB, np.linalg.norm(pA - pB, axis=2)

create_ramped_weighting(rectangle_shape, ramp_dist_frac)

Create a ramped weighting that is higher toward the center with a max value of 1 at a fraction from the edge

Parameters:

rectangle_shape (Tuple[int, int], required): Size of rectangle to create a mask for
ramp_dist_frac (float, required): Portions at least this far from an edge will have full weight

Returns:

np.ndarray: An array representing the weighting, with values from 0 to 1

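For example, a 5x5 weighting where anything at least 40% of the way in from each edge gets full weight:

from geograypher.utils.numeric import create_ramped_weighting

weights = create_ramped_weighting(rectangle_shape=(5, 5), ramp_dist_frac=0.4)
print(weights.round(2))
# [[0.   0.   0.   0.   0.  ]
#  [0.   0.62 0.62 0.62 0.  ]
#  [0.   0.62 1.   0.62 0.  ]
#  [0.   0.62 0.62 0.62 0.  ]
#  [0.   0.   0.   0.   0.  ]]
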
Source code in geograypher/utils/numeric.py
def create_ramped_weighting(
    rectangle_shape: typing.Tuple[int, int], ramp_dist_frac: float
) -> np.ndarray:
    """Create a ramped weighting that is higher toward the center with a max value of 1 at a fraction from the edge

    Args:
        rectangle_shape (typing.Tuple[int, int]): Size of rectangle to create a mask for
        ramp_dist_frac (float): Portions at least this far from an edge will have full weight

    Returns:
        np.ndarray: An array representing the weighting from 0-1
    """
    i_ramp = np.clip(np.linspace(0, 1 / ramp_dist_frac, num=rectangle_shape[0]), 0, 1)
    j_ramp = np.clip(np.linspace(0, 1 / ramp_dist_frac, num=rectangle_shape[1]), 0, 1)

    i_ramp = np.minimum(i_ramp, np.flip(i_ramp))
    j_ramp = np.minimum(j_ramp, np.flip(j_ramp))

    i_ramp = np.expand_dims(i_ramp, 1)
    j_ramp = np.expand_dims(j_ramp, 0)

    ramped_weighting = np.minimum(i_ramp, j_ramp)
    return ramped_weighting

fair_mode_non_nan(values)

Compute the most common value per row in an array of integers and nans. This behaves similarly to scipy.stats.mode(values, axis=1, nan_policy="omit") except that for values with equal counts, one is chosen randomly, rather than taking the lower value.

Parameters:

values (ndarray, required): (n, m) The input values (float-typed), consisting of integers and nans

Returns:

np.ndarray: (n,) the most common value per row

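A small sketch; note the tie in the second row is broken randomly, so either 0.0 or 1.0 is a valid result there:

import numpy as np

from geograypher.utils.numeric import fair_mode_non_nan

values = np.array(
    [
        [2.0, 2.0, 1.0, np.nan],           # clear mode: 2
        [0.0, 0.0, 1.0, 1.0],              # tie between 0 and 1
        [np.nan, np.nan, np.nan, np.nan],  # no values at all
    ]
)
print(fair_mode_non_nan(values))  # e.g. [ 2.  1. nan]
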
Source code in geograypher/utils/numeric.py
def fair_mode_non_nan(values: np.ndarray) -> np.ndarray:
    """
    Compute the most common value per row in an array of integers and nans. This behaves similarly to
    scipy.stats.mode(values, axis=1, nan_policy="omit") except that for values with equal counts,
    one is chosen randomly, rather than taking the lower value.

    Args:
        values (np.ndarray): (n, m) The input values (float-typed), consisting of integers and nans

    Returns:
        np.ndarray: (n,) the most common value per row
    """
    max_val = np.nanmax(values)
    max_val = int(max_val)
    # TODO consider using unique if these indices are sparse
    counts_per_value_per_row = np.array(
        [np.sum(values == i, axis=1) for i in range(max_val + 1)]
    ).T
    # Check which entries had no classes reported and mask them out
    # TODO consider removing these rows beforehand
    zeros_mask = np.all(counts_per_value_per_row == 0, axis=1)
    # We want to fairly tiebreak since np.argmax will always take the first index
    # This is hard to do in a vectorized way, so we just add a small random value
    # independently to each element
    counts_per_value_per_row = (
        counts_per_value_per_row
        + np.random.random(counts_per_value_per_row.shape) * 0.5
    )
    most_common_value_per_row = np.argmax(counts_per_value_per_row, axis=1).astype(
        float
    )
    # Set any faces with zero counts to nan
    most_common_value_per_row[zeros_mask] = np.nan
    return most_common_value_per_row

format_graph_edges(islice, jslice, dist, ray_IDs)

This function generates edge definitions for a graph where nodes represent rays and edges represent valid intersections between rays. It applies three filtering criteria:

1. Only uses edges where (i, j) is finite (not NaN)
2. Only uses edges where i < j (keeps it upper triangular)
3. Only uses edges between rays from different images (different ray_IDs)

Parameters:

islice (slice, required): Slice indicating the block of rows being processed in the chunked computation
jslice (slice, required): Slice indicating the block of columns being processed in the chunked computation
dist (ndarray, required): Distance matrix containing distances between rays (chunked). This is the [islice, jslice] section of a larger distance matrix
ray_IDs (ndarray, required): Array of identifiers indicating which image each ray comes from (not chunked)

Returns:

List[Tuple[int, int, Dict[str, float]]]: List of edge definitions, where each edge is a tuple of
- i index in the adjacency matrix
- j index in the adjacency matrix
- weight_dict of the form {"weight": value}
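
A minimal sketch using a hand-built 2x2 distance block; in practice the block comes from compute_approximate_ray_intersections inside calc_graph_weights:

import numpy as np

from geograypher.utils.numeric import format_graph_edges

# Distances between rays 0 and 1; the diagonal is already masked with NaN
dist = np.array([[np.nan, 0.5], [0.5, np.nan]])
ray_IDs = np.array([0, 1])  # the two rays come from different images

edges = format_graph_edges(slice(0, 2), slice(0, 2), dist, ray_IDs)
print(edges)  # [(0, 1, {'weight': 2.0})]: only the upper-triangular edge kept
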
Source code in geograypher/utils/numeric.py
def format_graph_edges(
    islice: slice,
    jslice: slice,
    dist: np.ndarray,
    ray_IDs: np.ndarray,
) -> typing.List[typing.Tuple[int, int, typing.Dict[str, float]]]:
    """
    This function generates edge definitions for a graph where nodes represent rays and
    edges represent valid intersections between rays. It applies three filtering criteria:
    1. Only uses edges where (i, j) is finite (not NaN)
    2. Only uses edges where i < j (keeps it upper triangular)
    3. Only uses edges between rays from different images (different ray_IDs)

    Args:
        islice (slice): Slice indicating the block of rows being processed in the
            chunked computation
        jslice (slice): Slice indicating the block of columns being processed in
            the chunked computation
        dist (np.ndarray): Distance matrix containing distances between rays (chunked)
            This is the [islice, jslice] section of a larger distance matrix.
        ray_IDs (np.ndarray): Array of identifiers indicating which image each ray comes
            from (not chunked)

    Returns:
        List[Tuple[int, int, Dict[str, float]]]: List of edge definitions, where each edge
        is a tuple of
        - i index in the adjacency matrix
        - j index in the adjacency matrix
        - weight_dict of the form {"weight": value}
    """

    # The places where the array is finite are the valid graph distances
    i_inds, j_inds = np.where(np.isfinite(dist))

    # Pre-calculate the inverse distance
    weights = 1 / dist

    return [
        (
            int(i) + islice.start,
            int(j) + jslice.start,
            {"weight": float(weights[i, j])},
        )
        for i, j in zip(i_inds, j_inds)
        if (i + islice.start < j + jslice.start)
        and (ray_IDs[i + islice.start] != ray_IDs[j + jslice.start])
    ]

intersection_average(starts, ends)

Given arrays of line segment start and end points, compute the average of the closest intersection points between all pairs of segments.

Parameters:

starts (ndarray, required): (N, 3) array of segment start points
ends (ndarray, required): (N, 3) array of segment end points

Returns:

np.ndarray: (3,) array, the average intersection point

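For example, three segments that all pass exactly through the origin:

import numpy as np

from geograypher.utils.numeric import intersection_average

# One segment along each coordinate axis, all crossing at (0, 0, 0)
starts = np.array([[-1.0, 0.0, 0.0], [0.0, -1.0, 0.0], [0.0, 0.0, -1.0]])
ends = np.array([[1.0, 0.0, 0.0], [0.0, 1.0, 0.0], [0.0, 0.0, 1.0]])
print(intersection_average(starts, ends))  # [0. 0. 0.]
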
Source code in geograypher/utils/numeric.py
def intersection_average(starts: np.ndarray, ends: np.ndarray) -> np.ndarray:
    """
    Given arrays of line segment start and end points, compute the average of the closest
    intersection points between all pairs of segments.

    Args:
        starts (np.ndarray): (N, 3) array of segment start points
        ends (np.ndarray): (N, 3) array of segment end points

    Returns:
        np.ndarray: (3,) array, the average intersection point
    """
    pA, pB, _ = compute_approximate_ray_intersections(
        a0=starts, a1=ends, b0=starts, b1=ends, clamp=True
    )
    mask = ~np.eye(starts.shape[0], dtype=bool)
    return np.mean(np.vstack([pA[mask], pB[mask]]), axis=0)