-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathnbgeohash.py
135 lines (120 loc) · 4.48 KB
/
nbgeohash.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
import numpy as np
import numba as nb
from numba import njit, types
from math import log10
@njit(cache=True, fastmath=True)
def base32_to_int(s: types.char) -> types.uint8:
"""
Returns the equivalent value of a base 32 character.
Surprisingly, on Numba this approach is faster than all the others.
"""
res = ord(s) - 48
if res > 9: res -= 40
if res > 16: res -= 1
if res > 18: res -= 1
if res > 20: res -= 1
return res
@njit(fastmath=True)
def nb_decode_exactly(geohash: types.string) -> types.Tuple:
"""
Decode the geohash to its exact values, including the error
margins of the result. Returns four float values: latitude,
longitude, the plus/minus error for latitude (as a positive
number) and the plus/minus error for longitude (as a positive
number).
"""
lat_interval_neg, lat_interval_pos, lon_interval_neg, lon_interval_pos = -90, 90, -180, 180
lat_err, lon_err = 90, 180
masks = np.array([16, 8, 4, 2, 1])
is_even = True
for c in geohash:
cd = base32_to_int(c)
for mask in masks:
if is_even: # adds longitude info
lon_err /= 2
if cd & mask:
lon_interval_neg = (lon_interval_neg +
lon_interval_pos) / 2
else:
lon_interval_pos = (lon_interval_neg +
lon_interval_pos) / 2
else: # adds latitude info
lat_err /= 2
if cd & mask:
lat_interval_neg = (lat_interval_neg +
lat_interval_pos) / 2
else:
lat_interval_pos = (lat_interval_neg +
lat_interval_pos) / 2
is_even = not is_even
lat = (lat_interval_neg + lat_interval_pos) / 2
lon = (lon_interval_neg + lon_interval_pos) / 2
return lat, lon, lat_err, lon_err
@njit(fastmath=True)
def nb_point_decode(geohash: types.string) -> types.Tuple:
"""
Decode geohash, returning two float with latitude and longitude containing only relevant digits.
"""
lat, lon, lat_err, lon_err = nb_decode_exactly(geohash)
# Format to the number of decimals that are known
lat_dec = max(1, round(-log10(lat_err))) - 1
lon_dec = max(1, round(-log10(lon_err))) - 1
lat = round(lat, lat_dec)
lon = round(lon, lon_dec)
return lat, lon
@njit(fastmath=True, parallel=True)
def nb_vector_decode(geohashes: types.Array) -> types.Tuple:
"""
Decode geohashes, returning two Arrays of floats with latitudes and longitudes containing only relevant digits.
"""
n = len(geohashes)
lats = np.empty(n)
lons = np.empty(n)
for i, geohash in enumerate(geohashes):
lat, lon, lat_err, lon_err = nb_decode_exactly(str(geohash))
# Format to the number of decimals that are known
lat_dec = max(1, round(-log10(lat_err))) - 1
lon_dec = max(1, round(-log10(lon_err))) - 1
lats[i] = round(lat, lat_dec)
lons[i] = round(lon, lon_dec)
return lats, lons
@njit(fastmath=True)
def nb_point_encode(latitude: types.float64, longitude: types.float64, precision: types.int8 = 12) -> types.string:
base32 = '0123456789bcdefghjkmnpqrstuvwxyz'
lat_interval_neg, lat_interval_pos, lon_interval_neg, lon_interval_pos = -90, 90, -180, 180
geohash = np.zeros(precision, dtype='<U1')
bits = np.array([16, 8, 4, 2, 1])
bit = 0
ch = 0
n = 0
even = True
while n < precision:
mid = (lon_interval_neg + lon_interval_pos) / 2
if even:
if longitude > mid:
ch |= bits[bit]
lon_interval_neg = mid
else:
lon_interval_pos = mid
else:
if latitude > mid:
ch |= bits[bit]
lat_interval_neg = mid
else:
lat_interval_pos = mid
even = not even
if bit < 4:
bit += 1
else:
geohash[n] = base32[ch]
bit = 0
ch = 0
n += 1
return ''.join(geohash)
@njit(fastmath=True, parallel=True)
def nb_vector_encode(latitudes: types.Array, longitudes: types.Array, precision: types.int8 = 12) -> types.Array:
n = len(latitudes)
geohashes = np.empty(n, dtype='<U12')
for i in range(n):
geohashes[i] = nb_point_encode(latitudes[i], longitudes[i], precision)
return geohashes