chore: move obs_process_track.py into the API source, as it is very specific to the API

Paul Bienkowski 2021-10-10 09:42:47 +02:00
parent e74d2c9130
commit 4742a6df13
3 changed files with 148 additions and 3 deletions

api/src/paths.js

@@ -1,5 +1,7 @@
 const path = require('path');
 
+const API_ROOT_DIR = path.resolve(__dirname, '../');
+
 const DATA_DIR = process.env.DATA_DIR || path.resolve(__dirname, '../../data/');
 
 // Contains the subtree for processing files
@@ -23,4 +25,4 @@ module.exports = {
   PROCESSING_DIR_PRIVATE,
   TRACKS_DIR,
   OBS_FACE_CACHE_DIR,
-}
+};

api/src/process_track.py (new file)

@@ -0,0 +1,142 @@
import argparse
import logging
import os
import tempfile
import json

from obs.face.importer import ImportMeasurementsCsv
from obs.face.annotate import AnnotateMeasurements
from obs.face.filter import MeasurementFilter, PrivacyFilter
from obs.face.geojson import ExportMeasurements, ExportRoadAnnotation
from obs.face.osm import DataSource as OSMDataSource

log = logging.getLogger(__name__)


def main():
logging.basicConfig(level=logging.DEBUG, format="%(levelname)s: %(message)s")
parser = argparse.ArgumentParser(
description="processes a single track for use in the portal, "
"using the obs.face algorithms"
)
parser.add_argument(
"-i", "--input", required=True, action="store", help="path to input CSV file"
)
parser.add_argument(
"-o", "--output", required=True, action="store", help="path to output directory"
)
    parser.add_argument(
        "--path-cache",
        action="store",
        default=None,
        dest="cache_dir",
        help="directory in which obs.face cache data (e.g. OSM downloads) is stored",
    )
    args = parser.parse_args()

    # Fall back to a temporary cache directory, cleaned up after processing,
    # if none was given.
    if args.cache_dir is None:
        with tempfile.TemporaryDirectory() as cache_dir:
            args.cache_dir = cache_dir
            process(args)
    else:
        process(args)


def process(args):
log.info("Loading OpenStreetMap data")
osm = OSMDataSource(cache_dir=args.cache_dir)
filename_input = os.path.abspath(args.input)
dataset_id = os.path.splitext(os.path.basename(args.input))[0]
os.makedirs(args.output, exist_ok=True)
filename_log = os.path.join(args.output, f"{dataset_id}.log")
log.info("Annotating and filtering CSV file")
with open(filename_log, "w") as logfile:
measurements, statistics = ImportMeasurementsCsv().read(
filename_input,
user_id="dummy",
dataset_id=dataset_id,
log=logfile,
)
measurements = AnnotateMeasurements(osm, cache_dir=args.cache_dir).annotate(measurements)
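
        # "Confirmed" measurements are overtaking events the rider confirmed
        # on the device; remove_unconfirmed=False keeps unconfirmed ones too.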
confirmed_measurements = MeasurementFilter().filter(measurements, log=logfile)
valid_measurements = MeasurementFilter(remove_unconfirmed=False).filter(measurements, log=logfile)
    # Point features for the confirmed measurements only.
confirmed_measurements_json = {
"type": "FeatureCollection",
"features": [
{
"type": "Feature",
"geometry": {
"type": "Point",
"coordinates": [m["latitude"], m["longitude"]],
},
"properties": {
"distanceOvertaker": m["distance_overtaker"],
"distanceStationary": m["distance_stationary"],
"confirmed": True,
},
}
for m in confirmed_measurements
],
}
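
    # Same structure, but including unconfirmed measurements; entries without
    # any distance value are skipped.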
all_measurements_json = {
"type": "FeatureCollection",
"features": [
{
"type": "Feature",
"geometry": {
"type": "Point",
"coordinates": [m["latitude"], m["longitude"]],
},
"properties": {
"distanceOvertaker": m["distance_overtaker"],
"distanceStationary": m["distance_stationary"],
"confirmed": m in confirmed_measurements,
},
}
for m in valid_measurements
if m["distance_overtaker"] or m["distance_stationary"]
],
}
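
    # The whole track as a single LineString geometry.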
track_json = {
"type": "Feature",
"geometry": {
"type": "LineString",
"coordinates": [
[m["latitude"], m["longitude"]] for m in valid_measurements
],
},
}
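
    # Summary of the statistics returned by the CSV importer.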
statistics_json = {
"recordedAt": statistics['t_min'].isoformat(),
"recordedUntil": statistics['t_max'].isoformat(),
"duration": statistics['t'],
"length": statistics['d'],
"segments": statistics['n_segments'],
"numEvents": statistics['n_confirmed'],
"numMeasurements": statistics['n_measurements'],
"numValid": statistics['n_valid'],
}
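
    # Write each document as indented JSON into the output directory.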
for output_filename, data in [
("all_measurements.json", all_measurements_json),
("confirmed_measurements.json", confirmed_measurements_json),
("track.json", track_json),
("statistics.json", statistics_json),
]:
with open(os.path.join(args.output, output_filename), 'w') as fp:
json.dump(data, fp, indent=4)
if __name__ == "__main__":
main()
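
For reference, the script can also be run by hand. A minimal invocation, with illustrative file paths:

    python api/src/process_track.py --input data/mytrack.csv --output output/mytrack --path-cache data/obs-face-cache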

api/src/worker.js

@@ -5,7 +5,7 @@ const { spawn } = require('child_process');
 const queue = require('./queue');
 require('./db');
 const { Track } = require('./models');
-const { PROCESSING_DIR, OBS_FACE_CACHE_DIR, PROCESSING_OUTPUT_DIR } = require('./paths');
+const { API_ROOT_DIR, PROCESSING_DIR, OBS_FACE_CACHE_DIR, PROCESSING_OUTPUT_DIR } = require('./paths');
 
 queue.process('processTrack', async (job) => {
   const track = await Track.findById(job.data.trackId);
@@ -55,8 +55,9 @@ queue.process('processTrack', async (job) => {
   // TODO: Generate track transformation settings (privacy zones etc)
   // const settingsFilePath = path.join(inputDirectory, 'track-settings.json');
   const child = spawn(
-    'obs-process-track',
+    'python',
     [
+      path.join(API_ROOT_DIR, 'src', 'process_track.py'),
       '--input',
       inputFilePath,
       '--output',