Skip to content

Commit

Permalink
fix(pivot2osm): OOM when selecting edges of pivot DB
Browse files Browse the repository at this point in the history
  • Loading branch information
azarz committed Feb 14, 2024
1 parent 95e2890 commit 364e94d
Show file tree
Hide file tree
Showing 2 changed files with 41 additions and 23 deletions.
11 changes: 8 additions & 3 deletions changelog.md
Original file line number Diff line number Diff line change
@@ -1,15 +1,20 @@
# CHANGELOG

## 2.2.3

CHANGED:
- Pivot to OSM: edges are now fetched from the pivot DB in batches, to avoid running out of memory

## 2.2.2

ADD:
- VACUUM ANALYSE is done only on created tables
- Templates for issues and PR
- Templates for issues and PR
- A code of conduct was adapted from the contributor covenant
- A contributing guide was added
- The DCO was added
- The DCO was added
- Restrict access to pedestrian ways according to BDTOPO
- Better handling of urbain column inside the BDTOPO
- Better handling of urbain column inside the BDTOPO

FIX:
- Durée de parcours incohérente sur OSRM entre car-fastest et car-shortest
Expand Down
53 changes: 33 additions & 20 deletions r2gg/_pivot_to_osm.py
Original file line number Diff line number Diff line change
Expand Up @@ -90,31 +90,44 @@ def pivot_to_osm(config, source, db_configs, connection, logger, output_is_pbf =
et_execute = time.time()
logger.info("Writing nodes ended. Elapsed time : %s seconds." %(et_execute - st_execute))

# Ecriture des ways
sql_query2 = getQueryByTableAndBoundingBox(f'{input_schema}.edges', source['bbox'], ['*', f'{input_schema}.inter_nodes(geom) as internodes'])
logger.info("SQL: {}".format(sql_query2))
# Récupération du nombre de ways
sql_query = f"SELECT COUNT(*) as cnt FROM {input_schema}.edges"
logger.info("SQL: {}".format(sql_query))
st_execute = time.time()
cursor.execute(sql_query2)
cursor.execute(sql_query)
et_execute = time.time()
logger.info("Execution ended. Elapsed time : %s seconds." %(et_execute - st_execute))
row = cursor.fetchone()
logger.info("Writing ways")
edgesize = row["cnt"]

# Ecriture des ways
batchsize = 500000
offset = 0
logger.info(f"Writing ways: {edgesize} ways to write")
st_execute = time.time()
i = 1
while row:
wayEl = writeWay(row, extraction_date)
for node in row['internodes']:
vertexSequence = vertexSequence + 1
node['id'] = vertexSequence
nodeEl = writeNode(node, extraction_date)
xf.write(nodeEl, pretty_print=True)
wayEl = writeWayNds(wayEl, row, row['internodes'])
wayEl = writeWayTags(wayEl, row)
xf.write(wayEl, pretty_print=True)
row = cursor.fetchone()
if (i % ceil(cursor.rowcount/10) == 0):
logger.info("%s / %s ways ajoutés" %(i, cursor.rowcount))
i += 1
while offset < edgesize:
sql_query2 = getQueryByTableAndBoundingBox(f'{input_schema}.edges', source['bbox'], ['*', f'{input_schema}.inter_nodes(geom) as internodes'])
sql_query2 += " LIMIT {} OFFSET {}".format(batchsize, offset)
logger.info("SQL: {}".format(sql_query2))
cursor.execute(sql_query2)
et_execute = time.time()
offset += batchsize
logger.info("Execution ended. Elapsed time : %s seconds." %(et_execute - st_execute))
row = cursor.fetchone()
st_execute = time.time()
i = 1
while row:
wayEl = writeWay(row, extraction_date)
for node in row['internodes']:
vertexSequence = vertexSequence + 1
node['id'] = vertexSequence
nodeEl = writeNode(node, extraction_date)
xf.write(nodeEl, pretty_print=True)
wayEl = writeWayNds(wayEl, row, row['internodes'])
wayEl = writeWayTags(wayEl, row)
xf.write(wayEl, pretty_print=True)
row = cursor.fetchone()
logger.info("%s / %s ways ajoutés" %(offset, edgesize))
et_execute = time.time()
logger.info("Writing ways ended. Elapsed time : %s seconds." %(et_execute - st_execute))

Expand Down

0 comments on commit 364e94d

Please sign in to comment.