mirror of
https://gitlab.com/wgp/dougal/software.git
synced 2025-12-06 13:27:08 +00:00
89 lines
2.0 KiB
Python
Executable File
89 lines
2.0 KiB
Python
Executable File
#!/usr/bin/python3
|
|
|
|
"""
|
|
Import raw p111.
|
|
|
|
For each survey in configuration.surveys(), check for new
|
|
or modified raw P1/11 files and (re-)import them into the
|
|
database.
|
|
"""
|
|
|
|
import os
|
|
import sys
|
|
import pathlib
|
|
import re
|
|
import configuration
|
|
import p111
|
|
from datastore import Datastore
|
|
|
|
if __name__ == '__main__':
    # Script entry point: for every configured survey, look for raw P1/11
    # files under the configured paths/globs and import the ones that the
    # database does not contain yet. For files already present, only the
    # NTBP flag is refreshed.

    print("Reading configuration")
    surveys = configuration.surveys()

    print("Connecting to database")
    db = Datastore()
    db.connect()

    print("Reading surveys")
    for survey in surveys:
        print(f'Survey: {survey["id"]} ({survey["schema"]})')

        db.set_survey(survey["schema"])

        try:
            raw_p111 = survey["raw"]["p111"]
        except KeyError:
            # A survey without raw P1/11 settings must not stop the
            # remaining surveys from being processed: skip this one
            # instead of terminating the whole script.
            print("No raw P1/11 configuration")
            continue

        pattern = raw_p111["pattern"]
        # Matched against the file's base name; its capture groups are
        # paired with pattern["captures"] to build the file metadata.
        rx = re.compile(pattern["regex"])

        # Reset on every survey so that a survey without an "ntbp" section
        # neither raises NameError nor inherits the previous survey's regex.
        ntbp_rx = None
        if "ntbp" in survey["raw"]:
            ntbp_rx = re.compile(survey["raw"]["ntbp"]["pattern"]["regex"])

        for fileprefix in raw_p111["paths"]:
            print(f"Path prefix: {fileprefix}")

            for globspec in raw_p111["globs"]:
                for filepath in pathlib.Path(fileprefix).glob(globspec):
                    filepath = str(filepath)
                    print(f"Found {filepath}")

                    # A file is flagged NTBP when the survey's NTBP regex
                    # is found anywhere in its full path; with no NTBP
                    # regex configured the flag is always False.
                    ntbp = (
                        ntbp_rx is not None
                        and ntbp_rx.search(filepath) is not None
                    )

                    if not db.file_in_db(filepath):
                        print("Importing")

                        match = rx.match(os.path.basename(filepath))
                        if not match:
                            error_message = f"File path not match the expected format! ({filepath} ~ {pattern['regex']})"
                            print(error_message, file=sys.stderr)
                            print("This file will be ignored!")
                            continue

                        # Name each regex capture group after the
                        # corresponding entry in pattern["captures"].
                        file_info = dict(zip(pattern["captures"], match.groups()))

                        p111_data = p111.from_file(filepath)

                        print("Saving")

                        # NOTE(review): presumably selects the "S" type
                        # records from the parsed file; confirm against
                        # p111.p111_type.
                        p111_records = p111.p111_type("S", p111_data)

                        db.save_raw_p111(p111_records, file_info, filepath, survey["epsg"], ntbp=ntbp)
                    else:
                        print("Already in DB")

                        # Update the NTBP status to whatever the latest is,
                        # as it might have changed.
                        db.set_ntbp(filepath, ntbp)
                        if ntbp:
                            print("Sequence is NTBP")

    print("Done")
|
|
|