Skip to content

GARSPandas module

GARSPandas

Source code in vgridpandas/garspandas.py
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
@pd.api.extensions.register_dataframe_accessor("gars")
class GARSPandas:
    def __init__(self, df: DataFrame):
        self._df = df

    # gars API
    # These methods simply mirror the Vgrid gars API and apply gars functions to all rows

    def latlon2gars(
        self,
        resolution: int,
        lat_col: str = "lat",
        lon_col: str = "lon",
        set_index: bool = False,
    ) -> AnyDataFrame:
        """Adds gars ID to (Geo)DataFrame.

        pd.DataFrame: uses `lat_col` and `lon_col` (default `lat` and `lon`)
        gpd.GeoDataFrame: uses `geometry`

        Assumes coordinates in epsg=4326.

        Parameters
        ----------
        resolution : int
            gars resolution
        lat_col : str
            Name of the latitude column (if used), default 'lat'
        lon_col : str
            Name of the longitude column (if used), default 'lon'
        set_index : bool
            If True, the columns with gars ID is set as index, default 'True'

        Returns
        -------
        (Geo)DataFrame with gars IDs added
        """

        if isinstance(self._df, gpd.GeoDataFrame):
            lons = self._df.geometry.x
            lats = self._df.geometry.y
        else:
            lons = self._df[lon_col]
            lats = self._df[lat_col]

        gars_ids = [
            latlon_to_gars(lat, lon, resolution) for lat, lon in zip(lats, lons)
        ]

        gars_col = GARS_COL
        assign_arg = {gars_col: gars_ids, f"{gars_col}_res": resolution}
        df = self._df.assign(**assign_arg)
        if set_index:
            return df.set_index(gars_col)
        return df

    def gars2geo(self, gars_col: str = None) -> GeoDataFrame:
        """Add geometry with GARS geometry to the DataFrame."""
        if gars_col is not None:
            if gars_col not in self._df.columns:
                raise ValueError(f"Column '{gars_col}' not found in DataFrame")
            ids = self._df[gars_col]
        else:
            if GARS_COL not in self._df.columns:
                raise ValueError(f"Column '{GARS_COL}' not found in DataFrame")
            ids = self._df[GARS_COL]
        return dggs_ids_to_geodataframe(self._df, ids, gars_to_geo)

    def garsbin(
        self,
        resolution: int,
        stats: str = "count",
        numeric_col: str = None,
        category_col: str = None,
        lat_col: str = "lat",
        lon_col: str = "lon",
    ) -> GeoDataFrame:
        """
        Bin points into gars cells and compute statistics.
        """
        gars_col = GARS_COL
        df = self.latlon2gars(resolution, lat_col, lon_col)
        result = aggregate_bin(df, gars_col, stats, numeric_col, category_col)
        return result.gars.gars2geo(gars_col=gars_col)

gars2geo(gars_col=None)

Add geometry with GARS geometry to the DataFrame.

Source code in vgridpandas/garspandas.py
70
71
72
73
74
75
76
77
78
79
80
def gars2geo(self, gars_col: str = None) -> GeoDataFrame:
    """Add geometry with GARS geometry to the DataFrame."""
    if gars_col is not None:
        if gars_col not in self._df.columns:
            raise ValueError(f"Column '{gars_col}' not found in DataFrame")
        ids = self._df[gars_col]
    else:
        if GARS_COL not in self._df.columns:
            raise ValueError(f"Column '{GARS_COL}' not found in DataFrame")
        ids = self._df[GARS_COL]
    return dggs_ids_to_geodataframe(self._df, ids, gars_to_geo)

garsbin(resolution, stats='count', numeric_col=None, category_col=None, lat_col='lat', lon_col='lon')

Bin points into gars cells and compute statistics.

Source code in vgridpandas/garspandas.py
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
def garsbin(
    self,
    resolution: int,
    stats: str = "count",
    numeric_col: str = None,
    category_col: str = None,
    lat_col: str = "lat",
    lon_col: str = "lon",
) -> GeoDataFrame:
    """
    Bin points into gars cells and compute statistics.
    """
    gars_col = GARS_COL
    df = self.latlon2gars(resolution, lat_col, lon_col)
    result = aggregate_bin(df, gars_col, stats, numeric_col, category_col)
    return result.gars.gars2geo(gars_col=gars_col)

latlon2gars(resolution, lat_col='lat', lon_col='lon', set_index=False)

Adds gars ID to (Geo)DataFrame.

pd.DataFrame: uses lat_col and lon_col (default lat and lon) gpd.GeoDataFrame: uses geometry

Assumes coordinates in epsg=4326.

Parameters

resolution : int gars resolution lat_col : str Name of the latitude column (if used), default 'lat' lon_col : str Name of the longitude column (if used), default 'lon' set_index : bool If True, the columns with gars ID is set as index, default 'True'

Returns

(Geo)DataFrame with gars IDs added

Source code in vgridpandas/garspandas.py
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
def latlon2gars(
    self,
    resolution: int,
    lat_col: str = "lat",
    lon_col: str = "lon",
    set_index: bool = False,
) -> AnyDataFrame:
    """Adds gars ID to (Geo)DataFrame.

    pd.DataFrame: uses `lat_col` and `lon_col` (default `lat` and `lon`)
    gpd.GeoDataFrame: uses `geometry`

    Assumes coordinates in epsg=4326.

    Parameters
    ----------
    resolution : int
        gars resolution
    lat_col : str
        Name of the latitude column (if used), default 'lat'
    lon_col : str
        Name of the longitude column (if used), default 'lon'
    set_index : bool
        If True, the columns with gars ID is set as index, default 'True'

    Returns
    -------
    (Geo)DataFrame with gars IDs added
    """

    if isinstance(self._df, gpd.GeoDataFrame):
        lons = self._df.geometry.x
        lats = self._df.geometry.y
    else:
        lons = self._df[lon_col]
        lats = self._df[lat_col]

    gars_ids = [
        latlon_to_gars(lat, lon, resolution) for lat, lon in zip(lats, lons)
    ]

    gars_col = GARS_COL
    assign_arg = {gars_col: gars_ids, f"{gars_col}_res": resolution}
    df = self._df.assign(**assign_arg)
    if set_index:
        return df.set_index(gars_col)
    return df