Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Updated algorithm to split aoi when no linear features #31

Merged
merged 10 commits into from
Jun 5, 2024
9 changes: 5 additions & 4 deletions .pre-commit-config.yaml
Original file line number Diff line number Diff line change
@@ -1,15 +1,15 @@
repos:
# Versioning: Commit messages & changelog
- repo: https://github.com/commitizen-tools/commitizen
rev: v3.13.0
rev: v3.27.0
hooks:
- id: commitizen
stages: [commit-msg]

# Lint / autoformat: Python code
- repo: https://github.com/astral-sh/ruff-pre-commit
# Ruff version.
rev: "v0.1.6"
rev: "v0.4.7"
hooks:
# Run the linter
- id: ruff
Expand All @@ -19,9 +19,10 @@ repos:

# Autoformat: YAML, JSON, Markdown, etc.
- repo: https://github.com/pre-commit/mirrors-prettier
rev: v3.1.0
rev: v4.0.0-alpha.8
hooks:
- id: prettier
entry: env PRETTIER_LEGACY_CLI=1 prettier
args:
[
--ignore-unknown,
Expand All @@ -33,7 +34,7 @@ repos:
]
# Lint: Markdown
- repo: https://github.com/igorshubovych/markdownlint-cli
rev: v0.38.0
rev: v0.41.0
hooks:
- id: markdownlint
args:
Expand Down
2 changes: 0 additions & 2 deletions docker-compose.yml
Original file line number Diff line number Diff line change
Expand Up @@ -15,8 +15,6 @@
# along with fmtm-splitter. If not, see <https:#www.gnu.org/licenses/>.
#

version: "3"

networks:
net:
name: fmtm-splitter
Expand Down
1 change: 1 addition & 0 deletions fmtm_splitter/db.py
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,7 @@
# along with fmtm-splitter. If not, see <https:#www.gnu.org/licenses/>.
#
"""DB models for temporary tables in splitBySQL."""

import logging
from typing import Union

Expand Down
208 changes: 142 additions & 66 deletions fmtm_splitter/fmtm_algorithm.sql
Original file line number Diff line number Diff line change
@@ -1,67 +1,97 @@
DROP TABLE IF EXISTS polygonsnocount;
-- Create a new polygon layer of splits by lines

CREATE TABLE polygonsnocount AS (
-- The Area of Interest provided by the person creating the project
WITH aoi AS (
SELECT * FROM "project_aoi"
)
-- Extract all lines to be used as splitlines from a table of lines
-- with the schema from Underpass (all tags as jsonb column called 'tags')
-- TODO: add polygons (closed ways in OSM) with a 'highway' tag;
-- some features such as roundabouts appear as polygons.
-- TODO: add waterway polygons; now a beach doesn't show up as a splitline.
-- TODO: these tags should come from another table rather than hardcoded
-- so that they're easily configured during project creation.
,splitlines AS (
-- SELECT ST_Intersection(a.geom, l.geom) AS geom
-- FROM aoi a, "ways_line" l
-- WHERE ST_Intersects(a.geom, l.geom)
-- -- TODO: these tags should come from a config table
-- -- All highways, waterways, and railways
-- AND (l.tags->>'highway' IS NOT NULL
-- OR l.tags->>'waterway' IS NOT NULL
-- OR l.tags->>'railway' IS NOT NULL
-- )

SELECT * from lines_view l
WHERE l.tags->>'highway' IS NOT NULL
OR l.tags->>'waterway' IS NOT NULL
OR l.tags->>'railway' IS NOT NULL
DO $$
DECLARE
lines_count INTEGER;
num_buildings INTEGER;
BEGIN
-- Check if ways_line has any data
SELECT COUNT(*) INTO lines_count FROM ways_line;

IF lines_count > 0 THEN
CREATE TABLE polygonsnocount AS (

)
-- Merge all lines, necessary so that the polygonize function works later
,merged AS (
SELECT ST_LineMerge(ST_Union(splitlines.geom)) AS geom
FROM splitlines
)
-- Combine the boundary of the AOI with the splitlines
-- First extract the Area of Interest boundary as a line
,boundary AS (
SELECT ST_Boundary(geom) AS geom
FROM aoi
)
-- Then combine it with the splitlines
,comb AS (
SELECT ST_Union(boundary.geom, merged.geom) AS geom
FROM boundary, merged
)
-- TODO add closed ways from OSM to lines (roundabouts etc)
-- Create a polygon for each area enclosed by the splitlines
,splitpolysnoindex AS (
SELECT (ST_Dump(ST_Polygonize(comb.geom))).geom as geom
FROM comb
)
-- Add an index column to the split polygons
,splitpolygons AS(
SELECT
row_number () over () as polyid,
ST_Transform(spni.geom,4326)::geography AS geog,
spni.*
from splitpolysnoindex spni
)
SELECT * FROM splitpolygons
);
-- The Area of Interest provided by the person creating the project
WITH aoi AS (
SELECT * FROM "project_aoi"
)
-- Extract all lines to be used as splitlines from a table of lines
-- with the schema from Underpass (all tags as jsonb column called 'tags')
-- TODO: add polygons (closed ways in OSM) with a 'highway' tag;
-- some features such as roundabouts appear as polygons.
-- TODO: add waterway polygons; now a beach doesn't show up as a splitline.
-- TODO: these tags should come from another table rather than hardcoded
-- so that they're easily configured during project creation.
, splitlines AS (
SELECT ST_Intersection(a.geom, l.geom) AS geom
FROM aoi a
JOIN "ways_line" l ON ST_Intersects(a.geom, l.geom)
WHERE (
(l.tags->>'highway' IS NOT NULL AND
l.tags->>'highway' NOT IN ('unclassified', 'residential', 'service', 'pedestrian', 'track', 'bus_guideway')) -- TODO: update(add/remove) this based on the requirements later
OR l.tags->>'waterway' IS NOT NULL
OR l.tags->>'railway' IS NOT NULL
)
)

-- SELECT * from lines_view l
-- WHERE (
-- (l.tags->>'highway' IS NOT NULL AND
-- l.tags->>'highway' NOT IN ('unclassified', 'residential', 'service', 'pedestrian', 'track', 'bus_guideway'))
-- OR l.tags->>'waterway' IS NOT NULL
-- OR l.tags->>'railway' IS NOT NULL
-- )
-- )
-- Merge all lines, necessary so that the polygonize function works later
,merged AS (
SELECT ST_LineMerge(ST_Union(splitlines.geom)) AS geom
FROM splitlines
)
-- Combine the boundary of the AOI with the splitlines
-- First extract the Area of Interest boundary as a line
,boundary AS (
SELECT ST_Boundary(geom) AS geom
FROM aoi
)
-- Then combine it with the splitlines
,comb AS (
SELECT ST_Union(boundary.geom, merged.geom) AS geom
FROM boundary, merged
)
-- TODO add closed ways from OSM to lines (roundabouts etc)
-- Create a polygon for each area enclosed by the splitlines
,splitpolysnoindex AS (
SELECT (ST_Dump(ST_Polygonize(comb.geom))).geom as geom
FROM comb
)
-- Add an index column to the split polygons
,splitpolygons AS(
SELECT
row_number () over () as polyid,
ST_Transform(spni.geom,4326)::geography AS geog,
spni.*
from splitpolysnoindex spni
)
SELECT * FROM splitpolygons
);
ELSE
-- Calculate number of buildings per cluster
CREATE TABLE polygonsnocount AS (
WITH aoi AS (
SELECT * FROM "project_aoi"
)
,transformed_aoi AS(
SELECT
row_number () over () as polyid,
ST_Transform(aoi.geom,4326)::geography AS geog,
aoi.geom
from aoi
)
SELECT * FROM transformed_aoi
);
END IF;
END $$;


-- Make that index column a primary key
Expand Down Expand Up @@ -130,7 +160,7 @@ with lowfeaturecountpolys as (
select *
from splitpolygons as p
-- TODO: feature count should not be hard-coded
where p.numfeatures < 20
where p.numfeatures < %(num_buildings)s
),
-- Find the neighbors of the low-feature-count polygons
-- Store their ids as n_polyid, numfeatures as n_numfeatures, etc
Expand Down Expand Up @@ -258,15 +288,61 @@ USING GIST (geom);
-- VACUUM ANALYZE voronois;
DROP TABLE voronoids;

DROP TABLE IF EXISTS unsimplifiedtaskpolygons;
CREATE TABLE unsimplifiedtaskpolygons AS (
SELECT ST_Union(geom) as geom, clusteruid
FROM voronois
GROUP BY clusteruid
);

CREATE INDEX unsimplifiedtaskpolygons_idx
ON unsimplifiedtaskpolygons
USING GIST (geom);

--VACUUM ANALYZE unsimplifiedtaskpolygons;


--*****************************Simplify*******************************
-- Extract unique line segments
DROP TABLE IF EXISTS taskpolygons;
CREATE TABLE taskpolygons AS (
SELECT ST_Union(geom) as geom, clusteruid
FROM voronois
GROUP BY clusteruid
--Convert task polygon boundaries to linestrings
WITH rawlines AS (
SELECT utp.clusteruid, st_boundary(utp.geom) AS geom
FROM unsimplifiedtaskpolygons AS utp
)
-- Union, which eliminates duplicates from adjacent polygon boundaries
,unionlines AS (
SELECT st_union(l.geom) AS geom FROM rawlines l
)
-- Dump, which gives unique segments.
,segments AS (
SELECT (st_dump(l.geom)).geom AS geom
FROM unionlines l
)
,agglomerated AS (
SELECT st_linemerge(st_unaryunion(st_collect(s.geom))) AS geom
FROM segments s
)
,simplifiedlines AS (
SELECT st_simplify(a.geom, 0.000075) AS geom
FROM agglomerated a
)
,taskpolygonsnoindex as (
SELECT (st_dump(st_polygonize(s.geom))).geom AS geom
FROM simplifiedlines s
)
SELECT
row_number () over () as taskid,
tpni.*
FROM taskpolygonsnoindex tpni
);

-- ALTER TABLE taskpolygons ADD PRIMARY KEY(taskid);
SELECT Populate_Geometry_Columns('public.taskpolygons'::regclass);
CREATE INDEX taskpolygons_idx
ON taskpolygons
USING GIST (geom);
ON taskpolygons
USING GIST (geom);
-- VACUUM ANALYZE taskpolygons;


Expand Down
7 changes: 4 additions & 3 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -86,8 +86,6 @@ target-versions = ["py310", "py311"]
fix = true
line-length = 132
target-version = "py310"
select = ["I", "E", "W", "D", "B", "F", "N", "Q"]
ignore = ["N805", "B008"]
exclude = [
".git",
".ruff_cache",
Expand All @@ -97,7 +95,10 @@ exclude = [
"dist",
"fmtm_splitter/__version__.py",
]
[tool.ruff.pydocstyle]
[tool.ruff.lint]
select = ["I", "E", "W", "D", "B", "F", "N", "Q"]
ignore = ["N805", "B008"]
[tool.ruff.lint.pydocstyle]
convention = "google"

[project.scripts]
Expand Down
11 changes: 4 additions & 7 deletions tests/test_splitter.py
Original file line number Diff line number Diff line change
Expand Up @@ -143,7 +143,7 @@ def test_split_by_sql_fmtm_with_extract(db, aoi_json, extract_json, output_json)
num_buildings=5,
osm_extract=extract_json,
)
assert len(features.get("features")) == 122
assert len(features.get("features")) == 120
assert sorted(features) == sorted(output_json)


Expand Down Expand Up @@ -173,13 +173,10 @@ def test_split_by_sql_fmtm_multi_geom(extract_json):
assert isinstance(features, geojson.feature.FeatureCollection)
assert isinstance(features.get("features"), list)
assert isinstance(features.get("features")[0], dict)
assert len(features.get("features")) == 47

multipolygons = [feature for feature in features.get("features", []) if feature.get("geometry").get("type") == "MultiPolygon"]
assert len(multipolygons) == 2
assert len(features.get("features")) == 35

polygons = [feature for feature in features.get("features", []) if feature.get("geometry").get("type") == "Polygon"]
assert len(polygons) == 45
assert len(polygons) == 35

polygon_feat = geojson.loads(json.dumps(polygons[0]))
assert isinstance(polygon_feat, geojson.Feature)
Expand Down Expand Up @@ -258,7 +255,7 @@ def test_split_by_sql_cli():
with open(outfile, "r") as jsonfile:
output_geojson = geojson.load(jsonfile)

assert len(output_geojson.get("features")) == 62
assert len(output_geojson.get("features")) == 60


def test_split_by_sql_cli_no_extract():
Expand Down
Loading