Geoparquet loader
In [1]:
Copied!
import geopandas as gpd
from shapely.geometry import box
from srai.constants import WGS84_CRS
from srai.loaders import GeoparquetLoader
import geopandas as gpd
from shapely.geometry import box
from srai.constants import WGS84_CRS
from srai.loaders import GeoparquetLoader
Basic usage¶
In [2]:
Copied!
gpql = GeoparquetLoader()
gpql = GeoparquetLoader()
In [3]:
Copied!
base_gdf = gpql.load(file_path="example_files/example.parquet")
base_gdf
base_gdf = gpql.load(file_path="example_files/example.parquet")
base_gdf
Out[3]:
| pop_est | continent | name | iso_a3 | gdp_md_est | geometry | |
|---|---|---|---|---|---|---|
| 0 | 920938 | Oceania | Fiji | FJI | 8374.0 | MULTIPOLYGON (((180 -16.06713, 180 -16.55522, ... | 
| 1 | 53950935 | Africa | Tanzania | TZA | 150600.0 | POLYGON ((33.90371 -0.95, 34.07262 -1.05982, 3... | 
| 2 | 603253 | Africa | W. Sahara | ESH | 906.5 | POLYGON ((-8.66559 27.65643, -8.66512 27.58948... | 
| 3 | 35623680 | North America | Canada | CAN | 1674000.0 | MULTIPOLYGON (((-122.84 49, -122.97421 49.0025... | 
| 4 | 326625791 | North America | United States of America | USA | 18560000.0 | MULTIPOLYGON (((-122.84 49, -120 49, -117.0312... | 
In [4]:
Copied!
base_gdf.explore()
base_gdf.explore()
Out[4]:
Make this Notebook Trusted to load map: File -> Trust Notebook
In [5]:
Copied!
indexed_gdf = gpql.load(file_path="example_files/example.parquet", index_column="name")
indexed_gdf
indexed_gdf = gpql.load(file_path="example_files/example.parquet", index_column="name")
indexed_gdf
Out[5]:
| pop_est | continent | iso_a3 | gdp_md_est | geometry | |
|---|---|---|---|---|---|
| name | |||||
| Fiji | 920938 | Oceania | FJI | 8374.0 | MULTIPOLYGON (((180 -16.06713, 180 -16.55522, ... | 
| Tanzania | 53950935 | Africa | TZA | 150600.0 | POLYGON ((33.90371 -0.95, 34.07262 -1.05982, 3... | 
| W. Sahara | 603253 | Africa | ESH | 906.5 | POLYGON ((-8.66559 27.65643, -8.66512 27.58948... | 
| Canada | 35623680 | North America | CAN | 1674000.0 | MULTIPOLYGON (((-122.84 49, -122.97421 49.0025... | 
| United States of America | 326625791 | North America | USA | 18560000.0 | MULTIPOLYGON (((-122.84 49, -120 49, -117.0312... | 
In [6]:
Copied!
limited_gdf = gpql.load(
    file_path="example_files/example.parquet", columns=["continent", "name", "pop_est"]
)
limited_gdf
limited_gdf = gpql.load(
    file_path="example_files/example.parquet", columns=["continent", "name", "pop_est"]
)
limited_gdf
Out[6]:
| continent | name | pop_est | geometry | |
|---|---|---|---|---|
| 0 | Oceania | Fiji | 920938 | MULTIPOLYGON (((180 -16.06713, 180 -16.55522, ... | 
| 1 | Africa | Tanzania | 53950935 | POLYGON ((33.90371 -0.95, 34.07262 -1.05982, 3... | 
| 2 | Africa | W. Sahara | 603253 | POLYGON ((-8.66559 27.65643, -8.66512 27.58948... | 
| 3 | North America | Canada | 35623680 | MULTIPOLYGON (((-122.84 49, -122.97421 49.0025... | 
| 4 | North America | United States of America | 326625791 | MULTIPOLYGON (((-122.84 49, -120 49, -117.0312... | 
In [7]:
Copied!
# Create Texas bounding box
bbox = box(minx=-106.645646, maxx=-93.508292, miny=25.837377, maxy=36.500704)
bbox_gdf = gpd.GeoDataFrame({"geometry": [bbox]}, crs=WGS84_CRS)
cut_gdf = gpql.load(file_path="example_files/example.parquet", area=bbox_gdf)
cut_gdf
# Create Texas bounding box
bbox = box(minx=-106.645646, maxx=-93.508292, miny=25.837377, maxy=36.500704)
bbox_gdf = gpd.GeoDataFrame({"geometry": [bbox]}, crs=WGS84_CRS)
cut_gdf = gpql.load(file_path="example_files/example.parquet", area=bbox_gdf)
cut_gdf
Out[7]:
| pop_est | continent | name | iso_a3 | gdp_md_est | geometry | |
|---|---|---|---|---|---|---|
| 4 | 326625791 | North America | United States of America | USA | 18560000.0 | POLYGON ((-93.84842 29.71363, -94.69 29.48, -9... | 
In [8]:
Copied!
cut_gdf.explore()
cut_gdf.explore()
Out[8]:
Make this Notebook Trusted to load map: File -> Trust Notebook