Merge pull request #1057 from debrief/for_release
Prepare new release
IanMayo authored Oct 7, 2021
2 parents 7b294aa + 15286bc commit bb479c5
Showing 28 changed files with 914 additions and 110 deletions.
4 changes: 2 additions & 2 deletions .github/workflows/test_pepys.yml
@@ -56,12 +56,12 @@ jobs:
      - name: Run black
        shell: bash -l {0}
        run: |
-          black --check --diff importers pepys_import pepys_admin
+          black --check --diff importers pepys_import pepys_admin pepys_timeline tests
      - name: Run isort
        shell: bash -l {0}
        run: |
-          isort --check-only --diff importers pepys_import pepys_admin
+          isort --check-only --diff importers pepys_import pepys_admin pepys_timeline tests
      - name: Get coverage report
        shell: bash -l {0}
2 changes: 1 addition & 1 deletion .pre-commit-config.yaml
@@ -1,6 +1,6 @@
repos:
  - repo: https://github.com/python/black
-    rev: 20.8b1
+    rev: 21.9b0
    hooks:
      - id: black
        language_version: python3
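With the pinned black revision bumped from 20.8b1 to 21.9b0, running the hooks locally with `pre-commit run --all-files` (a standard pre-commit invocation, not part of this commit) re-checks the whole repository against the same formatting checks that the updated test_pepys.yml workflow above runs in CI.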
6 changes: 6 additions & 0 deletions HISTORY.rst
@@ -2,6 +2,12 @@
History
=======

+0.0.30 (2021-10-05)
+-------------------
+
+* Incorporate Link16 importer
+* Include some performance upgrades, especially for Pepys-Admin
+
0.0.29 (2021-09-29)
-------------------

251 changes: 251 additions & 0 deletions importers/link_16_importer.py
@@ -0,0 +1,251 @@
import os
import re
from datetime import datetime, timedelta

from tqdm import tqdm

from pepys_import.core.formats import unit_registry
from pepys_import.core.formats.location import Location
from pepys_import.core.validators import constants
from pepys_import.file.highlighter.support.combine import combine_tokens
from pepys_import.file.importer import CANCEL_IMPORT, Importer
from pepys_import.utils.sqlalchemy_utils import get_lowest_privacy
from pepys_import.utils.text_formatting_utils import (
    custom_print_formatted_text,
    format_error_message,
)
from pepys_import.utils.unit_utils import convert_absolute_angle, convert_distance, convert_speed

V1_HEADER = "PPLI"
V2_HEADER = "Xmt/Rcv"


class Link16Importer(Importer):
    """Importer to handle two different formats of track information that are
    transmitted using Link-16 encoding
    """

    def __init__(self):
        super().__init__(
            name="Link-16 Format Importer",
            validation_level=constants.BASIC_LEVEL,
            short_name="Link-16 Importer",
            default_privacy="Private",
            datafile_type="Link-16",
        )
        self.version = 1

    def can_load_this_type(self, suffix):
        return suffix.upper() == ".CSV"

    def can_load_this_filename(self, filename):
        return True

    def can_load_this_header(self, header):
        # V1 starts with PPLI
        # V2 starts with Xmt/Rcv
        return header.startswith(V1_HEADER) or header.startswith(V2_HEADER)

    def can_load_this_file(self, file_contents):
        return True

    def _load_this_file(self, data_store, path, file_object, datafile, change_id):
        # Read the base timestamp from the filename
        filename, _ = os.path.splitext(os.path.basename(path))
        datetime_string = self.extract_timestamp(filename)
        if datetime_string is False:
            self.errors.append(
                {self.error_type: f"Error reading file {path}. Unable to read date from {filename}"}
            )
            return
        self.base_timestamp = self.timestamp_to_datetime(datetime_string)
        if self.base_timestamp is False:
            self.errors.append(
                {
                    self.error_type: f"Error reading file {path}. Unable to read date from {datetime_string}"
                }
            )
            return
        self.current_hour = self.base_timestamp.hour
        self.previous_time = timedelta(
            hours=0, minutes=self.base_timestamp.minute, seconds=self.base_timestamp.second
        )
        # We only need to apply the date component, as we've already applied the
        # hours (if missing) and the timestamps in the file are not offset from
        # the filename
        self.date_offset = datetime(
            year=self.base_timestamp.year,
            month=self.base_timestamp.month,
            day=self.base_timestamp.day,
            hour=0,
            minute=0,
            second=0,
        )

        # Now do what we'd normally do on load
        for line_number, line in enumerate(tqdm(file_object.lines()), 1):
            result = self._load_this_line(data_store, line_number, line, datafile, change_id)
            if result == CANCEL_IMPORT:
                custom_print_formatted_text(
                    format_error_message(f"Error in file caused cancellation of import of {path}")
                )
                break

    def _load_this_line(self, data_store, line_number, line, datafile, change_id):
        if line_number == 1:
            # Will only parse if one of these headers is found
            self.version = 1 if line.text.startswith(V1_HEADER) else 2
            return
        tokens = line.tokens(line.CSV_TOKENISER, ",")
        if len(tokens) <= 1:
            # Skip over any blank lines
            return

        if self.version == 1:
            if len(tokens) < 15:
                self.errors.append(
                    {self.error_type: f"Error on line {line_number}. Not enough tokens: {line}"}
                )
                return
            name_token = tokens[2]
            lat_degrees_token = tokens[8]
            lon_degrees_token = tokens[7]
            heading_token = tokens[11]
            speed_token = tokens[12]
            altitude_token = tokens[10]
        elif self.version == 2:
            if len(tokens) < 28:
                self.errors.append(
                    {self.error_type: f"Error on line {line_number}. Not enough tokens: {line}"}
                )
                return
            name_token = tokens[4]
            lat_degrees_token = tokens[13]
            lon_degrees_token = tokens[14]
            heading_token = tokens[16]
            speed_token = tokens[17]
            altitude_token = tokens[15]

        time_token = tokens[1]
        # Some files have HH:MM:SS.MS, others have MM:SS.MS, so we need to handle both
        time_parts = time_token.text.split(":")
        if len(time_parts) == 3:
            # We have HH:MM:SS.MS format
            line_time = timedelta(
                hours=int(time_parts[0]), minutes=int(time_parts[1]), seconds=float(time_parts[2])
            )
        elif len(time_parts) == 2:
            # The time is MM:SS.MS as read in from the file
            line_time = timedelta(
                hours=0, minutes=int(time_parts[0]), seconds=float(time_parts[1])
            )
            # Now deal with the hour component.
            # Has the time gone down from the last one? If so, we've shifted an hour forwards
            if line_time < self.previous_time:
                self.current_hour += 1

            self.previous_time = line_time
            # Turn the time from MM:SS.MS to HH:MM:SS.MS
            line_time += timedelta(hours=self.current_hour)
        else:  # Incorrect time format
            self.errors.append(
                {
                    self.error_type: f"Error on line {line_number}. Invalid timestamp {time_token.text}"
                }
            )
            return

        line_time += self.date_offset

        time_token.record(self.name, "timestamp", line_time)

        name_token.record(self.name, "vessel name", name_token.text)

        platform = self.get_cached_platform(
            data_store, platform_name=name_token.text, change_id=change_id
        )

        sensor_type = data_store.add_to_sensor_types("Location-Satellite", change_id=change_id).name
        privacy = get_lowest_privacy(data_store)
        sensor = platform.get_sensor(
            data_store=data_store,
            sensor_name="GPS",
            sensor_type=sensor_type,
            privacy=privacy,
            change_id=change_id,
        )
        state = datafile.create_state(data_store, platform, sensor, line_time, self.short_name)

        location = Location(errors=self.errors, error_type=self.error_type)
        lat_success = location.set_latitude_decimal_degrees(lat_degrees_token.text)
        lon_success = location.set_longitude_decimal_degrees(lon_degrees_token.text)
        if lat_success and lon_success:
            state.location = location
            combine_tokens(lon_degrees_token, lat_degrees_token).record(
                self.name, "location", state.location, "decimal degrees"
            )

        elevation_valid, elevation = convert_distance(
            altitude_token.text, unit_registry.foot, line_number, self.errors, self.error_type
        )
        if elevation_valid:
            state.elevation = elevation
            altitude_token.record(self.name, "altitude", state.elevation)

        heading_valid, heading = convert_absolute_angle(
            heading_token.text, line_number, self.errors, self.error_type
        )
        if heading_valid:
            state.heading = heading
            heading_token.record(self.name, "heading", heading)

        speed_valid, speed = convert_speed(
            speed_token.text,
            unit_registry.foot_per_second,
            line_number,
            self.errors,
            self.error_type,
        )
        if speed_valid:
            state.speed = speed
            speed_token.record(self.name, "speed", speed)

        datafile.flush_extracted_tokens()

    @staticmethod
    def extract_timestamp(filename):
        """Extracts a Link-16 timestamp from an unmodified filename

        :param filename: The Link-16 filename that contains a timestamp
        :type filename: String
        :return: The timestamp extracted from the filename
        :rtype: String
        """
        # All the files we've seen have a double file extension (raw... and csv)
        base_filename, _ = os.path.splitext(os.path.basename(filename))
        base_filename, _ = os.path.splitext(base_filename)
        # The timestamp could be anywhere in the filename, so find it
        extracted_datetime = re.search(r"(\d+-\d+-\d+T\d+-\d+-\d+)", base_filename)
        try:
            return extracted_datetime.group(1)
        except AttributeError:
            return False

    @staticmethod
    def timestamp_to_datetime(timestamp_string):
        """Converts a Link-16 formatted timestamp into a Python datetime

        :param timestamp_string: The Link-16 file timestamp (GMT/UTC/Zulu)
        :type timestamp_string: String
        :return: a datetime (GMT/UTC/Zulu) if conversion is successful,
            or False if unsuccessful
        :rtype: datetime | bool
        """
        timestamp_format = "%d-%m-%YT%H-%M-%S"
        try:
            return datetime.strptime(timestamp_string, timestamp_format)
        except ValueError:
            return False
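To make the filename helpers and the hour-rollover handling above concrete, here is a minimal standalone sketch (not part of the commit; the filename and MM:SS.MS row values are hypothetical) of how a base timestamp parsed from the filename combines with in-file times:

import re
from datetime import datetime, timedelta

# Hypothetical Link-16 filename carrying a dd-mm-yyyyTHH-MM-SS timestamp
filename = "TrackData_07-10-2021T12-58-30.raw.csv"
match = re.search(r"(\d+-\d+-\d+T\d+-\d+-\d+)", filename)
base = datetime.strptime(match.group(1), "%d-%m-%YT%H-%M-%S")  # 2021-10-07 12:58:30

current_hour = base.hour
previous = timedelta(minutes=base.minute, seconds=base.second)
date_offset = datetime(base.year, base.month, base.day)

for row_time in ["58:45.0", "59:59.5", "00:12.0"]:  # MM:SS.MS rows, no hour component
    minutes, seconds = row_time.split(":")
    line_time = timedelta(minutes=int(minutes), seconds=float(seconds))
    if line_time < previous:  # time went "backwards": an hour boundary was crossed
        current_hour += 1
    previous = line_time
    print(date_offset + line_time + timedelta(hours=current_hour))

# prints 12:58:45, then 12:59:59.5, then 13:00:12, all on 2021-10-07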
4 changes: 2 additions & 2 deletions migrations/latest_revisions.json
@@ -1,4 +1,4 @@
{
-    "LATEST_SQLITE_VERSION": "feb548c7c6c0",
-    "LATEST_POSTGRES_VERSION": "4899e94653f1"
+    "LATEST_SQLITE_VERSION": "e5c78b6abb2f",
+    "LATEST_POSTGRES_VERSION": "40d8ee1342f2"
}
52 changes: 52 additions & 0 deletions — new Alembic migration (file path not shown in this view)
@@ -0,0 +1,52 @@
"""Add indexes
Revision ID: 40d8ee1342f2
Revises: 4899e94653f1
Create Date: 2021-09-29 15:40:44.585519+00:00
"""
from alembic import op

# revision identifiers, used by Alembic.
revision = "40d8ee1342f2"
down_revision = "4899e94653f1"
branch_labels = None
depends_on = None


def upgrade():
# ### commands auto generated by Alembic - please adjust! ###
op.create_index(
op.f("ix_pepys_Activations_end"), "Activations", ["end"], unique=False, schema="pepys"
)
op.create_index(
op.f("ix_pepys_Activations_start"), "Activations", ["start"], unique=False, schema="pepys"
)
op.create_index(
op.f("ix_pepys_Comments_time"), "Comments", ["time"], unique=False, schema="pepys"
)
op.create_index(
op.f("ix_pepys_Contacts_time"), "Contacts", ["time"], unique=False, schema="pepys"
)
op.create_index(
op.f("ix_pepys_Geometries_end"), "Geometries", ["end"], unique=False, schema="pepys"
)
op.create_index(
op.f("ix_pepys_Geometries_start"), "Geometries", ["start"], unique=False, schema="pepys"
)
op.create_index(op.f("ix_pepys_Media_time"), "Media", ["time"], unique=False, schema="pepys")
op.create_index(op.f("ix_pepys_States_time"), "States", ["time"], unique=False, schema="pepys")
# ### end Alembic commands ###


def downgrade():
# ### commands auto generated by Alembic - please adjust! ###
op.drop_index(op.f("ix_pepys_States_time"), table_name="States", schema="pepys")
op.drop_index(op.f("ix_pepys_Media_time"), table_name="Media", schema="pepys")
op.drop_index(op.f("ix_pepys_Geometries_start"), table_name="Geometries", schema="pepys")
op.drop_index(op.f("ix_pepys_Geometries_end"), table_name="Geometries", schema="pepys")
op.drop_index(op.f("ix_pepys_Contacts_time"), table_name="Contacts", schema="pepys")
op.drop_index(op.f("ix_pepys_Comments_time"), table_name="Comments", schema="pepys")
op.drop_index(op.f("ix_pepys_Activations_start"), table_name="Activations", schema="pepys")
op.drop_index(op.f("ix_pepys_Activations_end"), table_name="Activations", schema="pepys")
# ### end Alembic commands ###
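For reference, this migration can be applied or reverted programmatically through Alembic's Python command API. A minimal sketch, assuming a standard alembic.ini at the project root (Pepys may drive migrations through its own admin tooling instead):

from alembic import command
from alembic.config import Config

cfg = Config("alembic.ini")  # assumed location of the Alembic configuration
command.upgrade(cfg, "40d8ee1342f2")    # create the time/start/end indexes
command.downgrade(cfg, "4899e94653f1")  # revert to the previous revision, dropping them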