I have a set of ~36,000 polygons which represent a partition (~counties) of the country.
My python script receives a lot of points: pointId, longitude, latitude.
For each point, I want to send back pointId, polygonId.
For each point, looping into all the polygons and use myPoint.within(myPolygon) is quite inefficient.
I suppose the shapely library offers a better way to prepare the polygon so that finding the polygon for a point becomes a tree path (country, region, sub region, ...)
Here is my code so far:
import sys
import os
import json
import time
import string
import uuid
py_id = str(uuid.uuid4())
sys.stderr.write(py_id + '
')
sys.stderr.write('point_in_polygon.py V131130a.
')
sys.stderr.flush()
from shapely.geometry import Point
from shapely.geometry import Polygon
import sys
import json
import string
import uuid
import time
jsonpath='.cantons.json'
jsonfile = json.loads(open(jsonpath).read())
def find(id, obj):
results = []
def _find_values(id, obj):
try:
for key, value in obj.iteritems():
if key == id:
results.append(value)
elif not isinstance(value, basestring):
_find_values(id, value)
except AttributeError:
pass
try:
for item in obj:
if not isinstance(item, basestring):
_find_values(id, item)
except TypeError:
pass
if not isinstance(obj, basestring):
_find_values(id, obj)
return results
#1-Load polygons from json
r=find('rings',jsonfile)
len_r = len(r)
#2-Load attributes from json
a=find('attributes',jsonfile)
def insidePolygon(point,json):
x=0
while x < len_r :
y=0
while y < len(r[x]) :
p=Polygon(r[x][y])
if(point.within(p)):
return a[y]['OBJECTID'],a[y]['NAME_5']
y=y+1
x=x+1
return None,None
while True:
line = sys.stdin.readline()
if not line:
break
try:
args, tobedropped = string.split(line, "
", 2)
#input: vehicleId, longitude, latitude
vehicleId, longitude, latitude = string.split(args, "")
point = Point(float(longitude), float(latitude))
cantonId,cantonName = insidePolygon(point,r)
#output: vehicleId, cantonId, cantonName
# vehicleId will be 0 if not found
# vehicleId will be < 0 in case of an exception
if (cantonId == None):
print "".join(["0", "", ""])
else:
print "".join([str(vehicleId), str(cantonId), str(cantonName)])
except ValueError:
print "".join(["-1", "", ""])
sys.stderr.write(py_id + '
')
sys.stderr.write('ValueError in Python script
')
sys.stderr.write(line)
sys.stderr.flush()
except:
sys.stderr.write(py_id + '
')
sys.stderr.write('Exception in Python script
')
sys.stderr.write(str(sys.exc_info()[0]) + '
')
sys.stderr.flush()
print "".join(["-2", "", ""])
See Question&Answers more detail:
os