Evan Siroky | 8b47abe | 2016-10-02 12:28:52 -0700 | [diff] [blame] | 1 | var exec = require('child_process').exec, |
| 2 | fs = require('fs'), |
evansiroky | d401c89 | 2016-06-16 00:05:14 -0700 | [diff] [blame] | 3 | http = require('http') |
| 4 | |
| 5 | var async = require('async'), |
evansiroky | 63d35e1 | 2016-06-16 10:08:15 -0700 | [diff] [blame] | 6 | jsts = require('jsts'), |
Evan Siroky | 8e30a2e | 2016-08-06 19:55:35 -0700 | [diff] [blame] | 7 | multiPolygon = require('turf-multipolygon'), |
evansiroky | d401c89 | 2016-06-16 00:05:14 -0700 | [diff] [blame] | 8 | overpass = require('query-overpass'), |
evansiroky | 4be1c7a | 2016-06-16 18:23:34 -0700 | [diff] [blame] | 9 | polygon = require('turf-polygon'), |
evansiroky | d401c89 | 2016-06-16 00:05:14 -0700 | [diff] [blame] | 10 | shp = require('shpjs') |
| 11 | |
| 12 | |
evansiroky | 63d35e1 | 2016-06-16 10:08:15 -0700 | [diff] [blame] | 13 | var osmBoundarySources = require('./osmBoundarySources.json'), |
evansiroky | 50216c6 | 2016-06-16 17:41:47 -0700 | [diff] [blame] | 14 | zoneCfg = require('./timezones.json'), |
evansiroky | 63d35e1 | 2016-06-16 10:08:15 -0700 | [diff] [blame] | 15 | geoJsonReader = new jsts.io.GeoJSONReader(), |
evansiroky | 4be1c7a | 2016-06-16 18:23:34 -0700 | [diff] [blame] | 16 | geoJsonWriter = new jsts.io.GeoJSONWriter(), |
Evan Siroky | 4fc596c | 2016-09-25 19:52:30 -0700 | [diff] [blame] | 17 | distZones = {} |
evansiroky | 63d35e1 | 2016-06-16 10:08:15 -0700 | [diff] [blame] | 18 | |
/**
 * Create a directory, treating "it already exists" as success.
 *
 * @param {string} dirname  Path of the directory to create
 * @param {Function} callback  Invoked with no arguments when `fs.mkdir`
 *   reported EEXIST, otherwise invoked with whatever error value `fs.mkdir`
 *   produced (falsy on success)
 */
var safeMkdir = function(dirname, callback) {
  fs.mkdir(dirname, function(mkdirErr) {
    var alreadyExists = Boolean(mkdirErr) && mkdirErr.code === 'EEXIST'
    if(!alreadyExists) {
      // success (falsy error) and every other failure are passed straight through
      return callback(mkdirErr)
    }
    callback()
  })
}
| 28 | |
/**
 * Run a geometry overlay operation and, if it fails, log the error and dump
 * both operands to `debug_<op>_a.json` / `debug_<op>_b.json` before
 * rethrowing.
 *
 * For 'diff', a failure whose `name` is 'TopologyException' is retried once
 * after passing both operands through a GeometryPrecisionReducer built from
 * `new jsts.geom.PrecisionModel(10000)`; when that retry is taken, the dumped
 * operands are the reduced ones.
 *
 * @param {string} op  One of 'union', 'intersection' or 'diff'
 * @param {Object} a   Left operand; must expose the method matching `op`
 *   (`union`, `intersection` or `difference`)
 * @param {Object} b   Right operand passed to that method
 * @return {Object} Whatever the operand method returned
 * @throws {Error} 'invalid op: <op>' for an unrecognised op, or the error
 *   raised by the geometry operation itself
 */
var debugGeo = function(op, a, b) {
  var result

  try {
    switch(op) {
      case 'union':
        result = a.union(b)
        break
      case 'intersection':
        result = a.intersection(b)
        break
      case 'diff':
        try {
          result = a.difference(b)
        } catch(e) {
          if(e.name !== 'TopologyException') {
            throw e
          }
          console.log('retry with GeometryPrecisionReducer')
          var precisionModel = new jsts.geom.PrecisionModel(10000),
            precisionReducer = new jsts.precision.GeometryPrecisionReducer(precisionModel)

          a = precisionReducer.reduce(a)
          b = precisionReducer.reduce(b)

          result = a.difference(b)
        }
        break
      default:
        throw new Error('invalid op: ' + op)
    }
  } catch(e) {
    console.log('op err')
    console.log(e)
    console.log(e.stack)
    // The dump is best-effort: a failure while serialising or writing the
    // operands must not replace the geometry error that is being reported.
    try {
      fs.writeFileSync('debug_' + op + '_a.json', JSON.stringify(geoJsonWriter.write(a)))
      fs.writeFileSync('debug_' + op + '_b.json', JSON.stringify(geoJsonWriter.write(b)))
    } catch(dumpErr) {
      console.log('unable to write debug geometry files')
      console.log(dumpErr)
    }
    throw e
  }

  return result
}
| 74 | |
/**
 * Skip a fetch when its target file can already be stat'ed.
 *
 * @param {string} file  Path checked with `fs.stat`
 * @param {Function} superCallback  Called with no arguments when the stat
 *   succeeds
 * @param {Function} fetchFn  Called with no arguments when the stat reports
 *   any error
 */
var fetchIfNeeded = function(file, superCallback, fetchFn) {
  fs.stat(file, function(statErr) {
    if(statErr) {
      fetchFn()
      return
    }
    return superCallback()
  })
}
| 81 | |
/**
 * Convert a GeoJSON object to a geometry by serialising it and handing the
 * string to the shared `geoJsonReader`.
 *
 * @param {Object} geoJson  Value to serialise with JSON.stringify
 * @return {Object} Whatever `geoJsonReader.read` returns
 */
var geoJsonToGeom = function(geoJson) {
  var serialized = JSON.stringify(geoJson)
  return geoJsonReader.read(serialized)
}
| 85 | |
/**
 * Convert a geometry to GeoJSON using the shared `geoJsonWriter`.
 *
 * @param {Object} geom  Geometry passed to `geoJsonWriter.write`
 * @return {Object} Whatever `geoJsonWriter.write` returns
 */
var geomToGeoJson = function (geom) {
  var geoJson = geoJsonWriter.write(geom)
  return geoJson
}
| 89 | |
/**
 * Convert a geometry to a JSON string of its GeoJSON form.
 *
 * @param {Object} geom  Geometry passed to `geoJsonWriter.write`
 * @return {string} JSON.stringify of the writer's output
 */
var geomToGeoJsonString = function(geom) {
  var geoJson = geoJsonWriter.write(geom)
  return JSON.stringify(geoJson)
}
| 93 | |
/**
 * Download one OSM boundary through Overpass, union all of its polygon
 * features into a single geometry and save it to
 * `./downloads/<boundaryId>.json`. Nothing is downloaded when that file can
 * already be stat'ed.
 *
 * The Overpass query selects relations matching every key/value pair of
 * `osmBoundarySources[boundaryId]`.
 *
 * @param {string} boundaryId  Key into `osmBoundarySources`
 * @param {Function} boundaryCallback  Called with no arguments when the file
 *   already exists, otherwise called by `async.auto` once the tasks finish
 *   or one of them reports an error
 */
var downloadOsmBoundary = function(boundaryId, boundaryCallback) {
  var cfg = osmBoundarySources[boundaryId],
    query = '[out:json][timeout:60];(relation',
    boundaryFilename = './downloads/' + boundaryId + '.json',
    debug = 'getting data for ' + boundaryId,
    queryKeys = Object.keys(cfg)

  // one ["key"="value"] filter per configured tag
  for (var i = queryKeys.length - 1; i >= 0; i--) {
    var k = queryKeys[i],
      v = cfg[k]

    query += '["' + k + '"="' + v + '"]'
  }

  query += ');out body;>;out meta qt;'

  console.log(debug)

  async.auto({
    downloadFromOverpass: function(cb) {
      console.log('downloading from overpass')
      // When the file already exists the outer callback is invoked directly
      // and this task's `cb` is never called, so the later tasks do not run.
      fetchIfNeeded(boundaryFilename, boundaryCallback, function() {
        overpass(query, cb, { flatProperties: true })
      })
    },
    validateOverpassResult: ['downloadFromOverpass', function(results, cb) {
      var data = results.downloadFromOverpass
      if(!data || !data.features || data.features.length === 0) {
        return cb(new Error('Invalid geojson for boundary: ' + boundaryId))
      }
      cb()
    }],
    saveSingleMultiPolygon: ['validateOverpassResult', function(results, cb) {
      var data = results.downloadFromOverpass,
        combined,
        serialized

      // Geometry work is synchronous and may throw; report that through `cb`
      // instead of letting it escape the async task.
      try {
        // union all multi-polygons / polygons into one
        for (var i = data.features.length - 1; i >= 0; i--) {
          var curOsmGeom = data.features[i].geometry
          if(curOsmGeom.type === 'Polygon' || curOsmGeom.type === 'MultiPolygon') {
            console.log('combining border')
            var curGeom = geoJsonToGeom(curOsmGeom)
            if(!combined) {
              combined = curGeom
            } else {
              combined = debugGeo('union', curGeom, combined)
            }
          }
        }

        // features were returned, but none of them was a (multi)polygon
        if(!combined) {
          throw new Error('No polygon geometry found for boundary: ' + boundaryId)
        }

        serialized = geomToGeoJsonString(combined)
      } catch(e) {
        return cb(e)
      }

      fs.writeFile(boundaryFilename, serialized, cb)
    }]
  }, boundaryCallback)
}
evansiroky | d401c89 | 2016-06-16 00:05:14 -0700 | [diff] [blame] | 149 | |
/**
 * Build the path of the dist file for a timezone id.
 *
 * @param {string} tzid  Timezone identifier; every '/' is replaced by '__'
 * @return {string} './dist/<flattened id>.json'
 */
var getTzDistFilename = function (tzid) {
  var flattenedId = tzid.split('/').join('__')
  return './dist/' + flattenedId + '.json'
}
| 153 | |
/**
 * Resolve a data-source descriptor to a geometry.
 *
 * @param {Object} source  Descriptor with a `source` key naming the kind of
 *   data, plus:
 *   - `id` when `source` is 'overpass' (loads ./downloads/<id>.json)
 *   - `id` when `source` is 'dist' (loads the file named by getTzDistFilename)
 *   - `data` when `source` is 'manual-polygon' or 'manual-multipolygon'
 * @return {Object} geom  The resolved GeoJSON passed through geoJsonToGeom
 * @throws {Error} 'unknown source: <kind>' for any other `source` value
 */
var getDataSource = function(source) {
  var kind = source.source,
    geoJson

  switch(kind) {
    case 'overpass':
      geoJson = require('./downloads/' + source.id + '.json')
      break
    case 'manual-polygon':
      geoJson = polygon(source.data).geometry
      break
    case 'manual-multipolygon':
      geoJson = multiPolygon(source.data).geometry
      break
    case 'dist':
      geoJson = require(getTzDistFilename(source.id))
      break
    default:
      throw new Error('unknown source: ' + kind)
  }

  return geoJsonToGeom(geoJson)
}
| 179 | |
/**
 * Build the boundary of one timezone by applying its configured operations
 * in order, then write the result to the file named by getTzDistFilename.
 *
 * Each entry of `zoneCfg[tzid]` is resolved with getDataSource and combined
 * with the running geometry according to its `op`:
 *   - 'init'                      replace the running geometry
 *   - 'intersect'                 running ∩ task
 *   - 'difference'                running − task
 *   - 'difference-reverse-order'  task − running
 *   - 'union'                     running ∪ task
 *
 * @param {string} tzid  Key into `zoneCfg`
 * @param {Function} callback  Called with an error when an operation is
 *   unknown or throws, otherwise passed to `fs.writeFile`
 */
var makeTimezoneBoundary = function(tzid, callback) {
  console.log('makeTimezoneBoundary for', tzid)

  var ops = zoneCfg[tzid],
    geom

  async.eachSeries(ops, function(task, cb) {
    var taskErr = null

    // Loading and combining geometries is synchronous and may throw; capture
    // the failure so it is reported the same way as an unknown op. `cb` is
    // called outside the try block so errors raised downstream of it are not
    // mistaken for failures of this task.
    try {
      var taskData = getDataSource(task)
      console.log('-', task.op, task.id)
      if(task.op === 'init') {
        geom = taskData
      } else if(task.op === 'intersect') {
        geom = debugGeo('intersection', geom, taskData)
      } else if(task.op === 'difference') {
        geom = debugGeo('diff', geom, taskData)
      } else if(task.op === 'difference-reverse-order') {
        geom = debugGeo('diff', taskData, geom)
      } else if(task.op === 'union') {
        geom = debugGeo('union', geom, taskData)
      } else {
        taskErr = new Error('unknown op: ' + task.op)
      }
    } catch(e) {
      taskErr = e
    }

    cb(taskErr)
  },
  function(err) {
    if(err) { return callback(err) }

    var serialized
    try {
      serialized = geomToGeoJsonString(geom)
    } catch(e) {
      return callback(e)
    }

    fs.writeFile(getTzDistFilename(tzid), serialized, callback)
  })
}
| 212 | |
/**
 * Populate `distZones` with one geometry per key of `zoneCfg`, each obtained
 * from getDataSource with a `{ source: 'dist', id: <tzid> }` descriptor.
 */
var loadDistZonesIntoMemory = function () {
  console.log('load zones into memory')

  Object.keys(zoneCfg).forEach(function (zoneId) {
    distZones[zoneId] = getDataSource({ source: 'dist', id: zoneId })
  })
}
| 223 | |
/**
 * Look up a zone's entry in `distZones`.
 *
 * @param {string} tzid  Key into `distZones`
 * @return {Object|undefined} The stored value, or undefined when absent
 */
var getDistZoneGeom = function (tzid) {
  var storedGeom = distZones[tzid]
  return storedGeom
}
| 227 | |
/**
 * Check every unordered pair of zones for overlap.
 *
 * A pair is reported (and validation fails) when the geometries intersect
 * and the area of their intersection is greater than 0.0001.
 *
 * @return {string|null} 'Zone validation unsuccessful' when at least one
 *   pair was reported, otherwise null
 */
var validateTimezoneBoundaries = function () {
  console.log('do validation')

  var tzids = Object.keys(zoneCfg),
    overlapFound = false

  tzids.forEach(function (tzid, idx) {
    var zoneGeom = getDistZoneGeom(tzid)

    // only compare against later zones so each pair is visited once
    tzids.slice(idx + 1).forEach(function (compareTzid) {
      var compareZoneGeom = getDistZoneGeom(compareTzid)
      if(!zoneGeom.intersects(compareZoneGeom)) {
        return
      }

      var overlapArea = debugGeo('intersection', zoneGeom, compareZoneGeom).getArea()
      if(overlapArea > 0.0001) {
        console.log('Validation error: ' + tzid + ' intersects ' + compareTzid + ' area: ' + overlapArea)
        overlapFound = true
      }
    })
  })

  if(overlapFound) {
    return 'Zone validation unsuccessful'
  }
  return null
}
| 257 | |
/**
 * Stream every zone into `./dist/combined.json` as one GeoJSON
 * FeatureCollection, one Feature per key of `zoneCfg` with the zone id stored
 * in `properties.tzid`.
 *
 * @param {Function} callback  Passed to `stream.end` together with the
 *   closing ']}'
 */
var combineAndWriteZones = function(callback) {
  var out = fs.createWriteStream('./dist/combined.json')
  var tzids = Object.keys(zoneCfg)

  out.write('{"type":"FeatureCollection","features":[')

  tzids.forEach(function (tzid, idx) {
    // comma-separate features; none before the first one
    if(idx !== 0) {
      out.write(',')
    }
    out.write(JSON.stringify({
      type: 'Feature',
      properties: { tzid: tzid },
      geometry: geomToGeoJson(getDistZoneGeom(tzid))
    }))
  })

  out.end(']}', callback)
}
| 277 | |
// Build pipeline, run on load. Task order is driven by the dependency lists:
//   makeDownloadsDir -> getOsmBoundaries -+
//   makeDistDir --------------------------+-> createZones -> validateZones
//     -> mergeZones -> zipGeoJson
//                   -> makeShapefile
// A failure in any task is logged and reflected in the process exit code.
async.auto({
  makeDownloadsDir: function(cb) {
    console.log('creating downloads dir')
    safeMkdir('./downloads', cb)
  },
  makeDistDir: function(cb) {
    console.log('createing dist dir')
    safeMkdir('./dist', cb)
  },
  getOsmBoundaries: ['makeDownloadsDir', function(results, cb) {
    console.log('downloading osm boundaries')
    async.eachSeries(Object.keys(osmBoundarySources), downloadOsmBoundary, cb)
  }],
  createZones: ['makeDistDir', 'getOsmBoundaries', function(results, cb) {
    console.log('createZones')
    async.each(Object.keys(zoneCfg), makeTimezoneBoundary, cb)
  }],
  validateZones: ['createZones', function(results, cb) {
    console.log('validating zones')
    var validationErr

    // Loading and validating are synchronous and may throw; route that
    // through `cb` like any other task failure. `cb` is called outside the
    // try block so errors raised downstream are not caught here.
    try {
      loadDistZonesIntoMemory()
      validationErr = validateTimezoneBoundaries()
    } catch(e) {
      validationErr = e
    }

    cb(validationErr)
  }],
  mergeZones: ['validateZones', function(results, cb) {
    console.log('merge zones')
    combineAndWriteZones(cb)
  }],
  zipGeoJson: ['mergeZones', function (results, cb) {
    console.log('zip geojson')
    exec('zip dist/timezones.geojson.zip dist/combined.json', cb)
  }],
  makeShapefile: ['mergeZones', function (results, cb) {
    console.log('convert from geojson to shapefile')
    exec('ogr2ogr -nlt MULTIPOLYGON dist/combined_shapefile.shp dist/combined.json OGRGeoJSON', function (err) {
      if(err) { return cb(err) }
      exec('zip dist/timezones.shapefile.zip dist/combined_shapefile.*', cb)
    })
  }]
}, function(err) {
  console.log('done')
  if(err) {
    console.log('error!', err)
    // let callers (shell scripts, CI) see that the build failed
    process.exitCode = 1
    return
  }
})