BAG2LoaderMain.java

  1. /*
  2.  * Copyright (C) 2021 B3Partners B.V.
  3.  *
  4.  * SPDX-License-Identifier: MIT
  5.  *
  6.  */

  7. package nl.b3p.brmo.bag2.loader.cli;

  8. import static nl.b3p.brmo.bag2.schema.BAG2SchemaMapper.METADATA_TABLE_NAME;
  9. import static nl.b3p.brmo.bag2.schema.BAG2SchemaMapper.Metadata.CURRENT_TECHNISCHE_DATUM;
  10. import static nl.b3p.brmo.bag2.schema.BAG2SchemaMapper.Metadata.FILTER_GEOMETRIE;
  11. import static nl.b3p.brmo.bag2.schema.BAG2SchemaMapper.Metadata.GEMEENTE_CODES;
  12. import static nl.b3p.brmo.bag2.schema.BAG2SchemaMapper.Metadata.STAND_LOAD_TECHNISCHE_DATUM;
  13. import static nl.b3p.brmo.bag2.schema.BAG2SchemaMapper.Metadata.STAND_LOAD_TIME;
  14. import static nl.b3p.brmo.bgt.loader.Utils.getMessageFormattedString;

  15. import java.io.FileInputStream;
  16. import java.io.IOException;
  17. import java.io.InputStream;
  18. import java.net.CookieManager;
  19. import java.net.URI;
  20. import java.net.http.HttpClient;
  21. import java.net.http.HttpRequest;
  22. import java.net.http.HttpResponse;
  23. import java.nio.file.Files;
  24. import java.nio.file.Path;
  25. import java.sql.PreparedStatement;
  26. import java.text.SimpleDateFormat;
  27. import java.time.LocalDate;
  28. import java.util.Date;
  29. import java.util.HashMap;
  30. import java.util.HashSet;
  31. import java.util.Map;
  32. import java.util.Set;
  33. import java.util.regex.Matcher;
  34. import java.util.regex.Pattern;
  35. import nl.b3p.brmo.bag2.loader.BAG2Database;
  36. import nl.b3p.brmo.bag2.loader.BAG2GMLMutatieGroepStream;
  37. import nl.b3p.brmo.bag2.loader.BAG2LoaderUtils;
  38. import nl.b3p.brmo.bag2.loader.BAG2ProgressReporter;
  39. import nl.b3p.brmo.bag2.schema.BAG2ObjectTableWriter;
  40. import nl.b3p.brmo.bag2.schema.BAG2ObjectType;
  41. import nl.b3p.brmo.bag2.schema.BAG2Schema;
  42. import nl.b3p.brmo.bag2.schema.BAG2SchemaMapper;
  43. import nl.b3p.brmo.schema.ObjectType;
  44. import nl.b3p.brmo.sql.GeometryHandlingPreparedStatementBatch;
  45. import nl.b3p.brmo.sql.LoggingQueryRunner;
  46. import nl.b3p.brmo.sql.QueryBatch;
  47. import nl.b3p.brmo.sql.dialect.OracleDialect;
  48. import nl.b3p.brmo.util.ResumingInputStream;
  49. import nl.b3p.brmo.util.http.HttpClientWrapper;
  50. import nl.b3p.brmo.util.http.HttpStartRangeInputStreamProvider;
  51. import nl.b3p.brmo.util.http.wrapper.Java11HttpClientWrapper;
  52. import org.apache.commons.compress.archivers.zip.ZipArchiveEntry;
  53. import org.apache.commons.compress.archivers.zip.ZipArchiveInputStream;
  54. import org.apache.commons.io.input.CloseShieldInputStream;
  55. import org.apache.commons.lang3.tuple.Pair;
  56. import org.apache.commons.logging.Log;
  57. import org.apache.commons.logging.LogFactory;
  58. import org.apache.log4j.PropertyConfigurator;
  59. import org.geotools.util.logging.Logging;
  60. import org.locationtech.jts.geom.Geometry;
  61. import org.locationtech.jts.io.WKTReader;
  62. import picocli.CommandLine;
  63. import picocli.CommandLine.Command;
  64. import picocli.CommandLine.ExitCode;
  65. import picocli.CommandLine.IVersionProvider;
  66. import picocli.CommandLine.Mixin;
  67. import picocli.CommandLine.Option;
  68. import picocli.CommandLine.Parameters;

  69. @Command(
  70.     name = "bag2-loader",
  71.     mixinStandardHelpOptions = true,
  72.     versionProvider = BAG2LoaderMain.class,
  73.     resourceBundle = BAG2LoaderUtils.BUNDLE_NAME,
  74.     subcommands = {BAG2MutatiesCommand.class})
  75. public class BAG2LoaderMain implements IVersionProvider {
  76.   private static Log log;

  77.   /* zodat we een JNDI database kunnen gebruiken */
  78.   private BAG2Database bag2Database = null;

  79.   private Set<BAG2ObjectType> objectTypesWithSchemaCreated = new HashSet<>();

  80.   private Map<BAG2ObjectType, Set<Pair<Object, Object>>> keysPerObjectType = new HashMap<>();

  81.   /**
  82.    * init logging.
  83.    *
  84.    * @param standAlone set to {@code false} when using in a preconfigured environment, eg. calling
  85.    *     methods from a servlet, use {@code true} for commandline usage.
  86.    */
  87.   public static void configureLogging(boolean standAlone) {
  88.     if (standAlone) {
  89.       PropertyConfigurator.configure(
  90.           BAG2LoaderMain.class.getResourceAsStream("/bag2-loader-cli-log4j.properties"));
  91.       log = LogFactory.getLog(BAG2LoaderMain.class);
  92.       try {
  93.         Logging.ALL.setLoggerFactory("org.geotools.util.logging.Log4JLoggerFactory");
  94.       } catch (ClassNotFoundException ignored) {
  95.       }
  96.     } else {
  97.       log = LogFactory.getLog(BAG2LoaderMain.class);
  98.     }
  99.   }

  100.   public static void main(String... args) {
  101.     configureLogging(true);

  102.     CommandLine cmd = new CommandLine(new BAG2LoaderMain()).setUsageHelpAutoWidth(true);
  103.     System.exit(cmd.execute(args));
  104.   }

  105.   @Override
  106.   public String[] getVersion() {
  107.     return new String[] {BAG2LoaderUtils.getLoaderVersion(), BAG2LoaderUtils.getUserAgent()};
  108.   }

  109.   @Command(name = "load", sortOptions = false)
  110.   public int load(
  111.       @Mixin BAG2DatabaseOptions dbOptions,
  112.       @Mixin BAG2LoadOptions loadOptions,
  113.       @Mixin BAG2ProgressOptions progressOptions,
  114.       @Parameters(paramLabel = "<file>") String[] filenames,
  115.       @Option(
  116.               names = {"-h", "--help"},
  117.               usageHelp = true)
  118.           boolean showHelp)
  119.       throws Exception {

  120.     log.info(BAG2LoaderUtils.getUserAgent());

  121.     try (BAG2Database db = getBAG2Database(dbOptions)) {
  122.       BAG2ProgressReporter progressReporter =
  123.           progressOptions.isConsoleProgressEnabled()
  124.               ? new BAG2ConsoleProgressReporter()
  125.               : new BAG2ProgressReporter();

  126.       loadFiles(db, dbOptions, loadOptions, progressReporter, filenames, null);
  127.       return ExitCode.OK;
  128.     }
  129.   }

  130.   @Command(name = "apply-geo-filter", sortOptions = false)
  131.   public int applyGeoFilterCommand(
  132.       @Mixin BAG2DatabaseOptions dbOptions,
  133.       @CommandLine.Option(names = "--geo-filter", paramLabel = "<wkt>") String geoFilter)
  134.       throws Exception {
  135.     log.info(BAG2LoaderUtils.getUserAgent());

  136.     try (BAG2Database db = getBAG2Database(dbOptions)) {
  137.       applyGeoFilter(db, new BAG2LoadOptions().setGeoFilter(geoFilter));
  138.       return ExitCode.OK;
  139.     }
  140.   }

  141.   public BAG2Database getBAG2Database(BAG2DatabaseOptions dbOptions) throws ClassNotFoundException {
  142.     if (bag2Database == null) {
  143.       bag2Database = new BAG2Database(dbOptions);
  144.     }
  145.     return bag2Database;
  146.   }

  147.   public void setBag2Database(BAG2Database bag2Database) {
  148.     this.bag2Database = bag2Database;
  149.   }

  150.   public void loadFiles(
  151.       BAG2Database db,
  152.       BAG2DatabaseOptions dbOptions,
  153.       BAG2LoadOptions loadOptions,
  154.       BAG2ProgressReporter progressReporter,
  155.       String[] filenames,
  156.       CookieManager cookieManager)
  157.       throws Exception {

  158.     if (filenames.length == 1 && Files.isDirectory(Path.of(filenames[0]))) {
  159.       log.info("Directory opgegeven, kijken naar toepasbare mutaties...");
  160.       filenames =
  161.           Files.list(Path.of(filenames[0]))
  162.               .filter(p -> !Files.isDirectory(p) && p.getFileName().toString().endsWith(".zip"))
  163.               .map(p -> p.toAbsolutePath().toString())
  164.               .toArray(String[]::new);
  165.       if (filenames.length == 0) {
  166.         log.info("Geen ZIP bestanden gevonden, niets te doen");
  167.       } else {
  168.         applyMutaties(db, dbOptions, loadOptions, progressReporter, filenames, null);
  169.       }
  170.       return;
  171.     }

  172.     BAG2LoaderUtils.BAGExtractSelectie bagExtractLevering =
  173.         BAG2LoaderUtils.getBAGExtractSelectieFromZip(filenames[0]);

  174.     if (bagExtractLevering.isStand()) {
  175.       if (bagExtractLevering.isGebiedNLD()) {
  176.         if (filenames.length > 1) {
  177.           throw new IllegalArgumentException(
  178.               "Inladen stand heel Nederland: teveel bestanden opgegeven");
  179.         }
  180.       } else {
  181.         // Verify all filenames are gemeentestanden
  182.         Set<String> gemeenteCodes = new HashSet<>();
  183.         for (int i = 1; i < filenames.length; i++) {
  184.           BAG2LoaderUtils.BAGExtractSelectie nextBagExtractLevering =
  185.               BAG2LoaderUtils.getBAGExtractSelectieFromZip(filenames[i]);

  186.           if (!nextBagExtractLevering.isStand() || nextBagExtractLevering.isGebiedNLD()) {
  187.             throw new IllegalArgumentException(
  188.                 "Inladen stand gemeentes, ongeldig bestand opgegeven (geen gemeentestand): "
  189.                     + filenames[i]);
  190.           }
  191.           Set<String> nextBagExtractLeveringGemeenteCodes =
  192.               nextBagExtractLevering.getGemeenteCodes();
  193.           if (gemeenteCodes.stream().anyMatch(nextBagExtractLeveringGemeenteCodes::contains)) {
  194.             throw new IllegalArgumentException(
  195.                 "Inladen stand gemeentes, dubbele gemeentecode in bestand: " + filenames[i]);
  196.           }
  197.           gemeenteCodes.addAll(nextBagExtractLeveringGemeenteCodes);
  198.         }
  199.       }

  200.       new LoggingQueryRunner().update(db.getConnection(), "create sequence objectid_seq");

  201.       loadStandFiles(db, dbOptions, loadOptions, progressReporter, filenames, cookieManager);
  202.     } else {
  203.       // Process mutaties while ignoring files not applicable
  204.       applyMutaties(db, dbOptions, loadOptions, progressReporter, filenames, null);
  205.     }
  206.   }

  207.   /**
  208.    * Only called after list of files have been checked to only have been entire NL stand or unique
  209.    * gemeente standen.
  210.    */
  211.   private void loadStandFiles(
  212.       BAG2Database db,
  213.       BAG2DatabaseOptions dbOptions,
  214.       BAG2LoadOptions loadOptions,
  215.       BAG2ProgressReporter progressReporter,
  216.       String[] filenames,
  217.       CookieManager cookieManager)
  218.       throws Exception {
  219.     try {
  220.       // When loading multiple standen (for gemeentes), set ignore duplicates so the seen
  221.       // object keys are kept in
  222.       // memory so duplicates can be ignored. Don't keep keys in memory for entire NL stand.
  223.       loadOptions.setIgnoreDuplicates(filenames.length > 1);

  224.       // Multiple gemeentes can also be provided in a single ZIP file, check the
  225.       // Leveringsdocument whether that is
  226.       // the case
  227.       if (filenames.length == 1) {
  228.         BAG2LoaderUtils.BAGExtractSelectie levering =
  229.             BAG2LoaderUtils.getBAGExtractSelectieFromZip(filenames[0]);
  230.         if (!levering.isGebiedNLD()) {
  231.           loadOptions.setIgnoreDuplicates(levering.getGemeenteCodes().size() > 1);
  232.         }
  233.       }

  234.       BAG2GMLMutatieGroepStream.BagInfo bagInfo = null;
  235.       String lastFilename = null;

  236.       // Keep track of which gemeentes are loaded so the correct mutations can be processed
  237.       // later
  238.       Set<String> gemeenteIdentificaties = new HashSet<>();

  239.       for (String filename : filenames) {
  240.         BAG2GMLMutatieGroepStream.BagInfo latestBagInfo =
  241.             loadBAG2ExtractFromURLorFile(db, loadOptions, dbOptions, progressReporter, filename);
  242.         if (bagInfo != null) {
  243.           // For gemeentes the BagInfo must be the same so the standen are of the same
  244.           // date
  245.           if (!latestBagInfo.equalsExceptGemeenteIdentificaties(bagInfo)) {
  246.             throw new IllegalArgumentException(
  247.                 String.format(
  248.                     "Incompatible BagInfo for file \"%s\" (%s) compared to last file \"%s\" (%s)",
  249.                     filename, latestBagInfo, lastFilename, bagInfo));
  250.           }
  251.         }
  252.         bagInfo = latestBagInfo;

  253.         // For NL stand this will be "9999"
  254.         gemeenteIdentificaties.addAll(bagInfo.getGemeenteIdentificaties());
  255.         lastFilename = filename;
  256.       }
  257.       if (bagInfo != null) {
  258.         // TODO: when loading gemeente without rare objects such as
  259.         // ligplaatsen/standplaatsen, table will not be created
  260.         // and a future change with such an object will fail. Should create entire schema
  261.         // up-front instead of when first
  262.         // encountering object type
  263.         createKeysAndIndexes(db, loadOptions, dbOptions, progressReporter);

  264.         updateMetadata(
  265.             db, loadOptions, true, gemeenteIdentificaties, bagInfo.getStandTechnischeDatum());
  266.       }
  267.       db.getConnection().commit();

  268.       applyGeoFilter(db, loadOptions);
  269.     } finally {
  270.       progressReporter.reportTotalSummary();
  271.     }
  272.   }

  273.   public void applyMutaties(
  274.       BAG2Database db,
  275.       BAG2DatabaseOptions dbOptions,
  276.       BAG2LoadOptions loadOptions,
  277.       BAG2ProgressReporter progressReporter,
  278.       String[] urls,
  279.       CookieManager cookieManager)
  280.       throws Exception {
  281.     if (urls.length == 0) {
  282.       return;
  283.     }
  284.     BAG2LoaderUtils.BAGExtractSelectie bagExtractLevering =
  285.         BAG2LoaderUtils.getBAGExtractSelectieFromZip(urls[0]);
  286.     if (bagExtractLevering.isGebiedNLD()) {
  287.       applyNLMutaties(db, dbOptions, loadOptions, progressReporter, urls, cookieManager);
  288.     } else {
  289.       applyGemeenteMutaties(db, dbOptions, loadOptions, progressReporter, urls, cookieManager);
  290.     }
  291.   }

  292.   private void applyGemeenteMutaties(
  293.       BAG2Database db,
  294.       BAG2DatabaseOptions dbOptions,
  295.       BAG2LoadOptions loadOptions,
  296.       BAG2ProgressReporter progressReporter,
  297.       String[] urls,
  298.       CookieManager cookieManager)
  299.       throws Exception {
  300.     LocalDate currentTechnischeDatum = db.getCurrentTechnischeDatum();
  301.     Set<String> gemeenteCodes = db.getGemeenteCodes();

  302.     Set<Integer> applicableMutatieIndexes;
  303.     do {
  304.       applicableMutatieIndexes = new HashSet<>();

  305.       Set<String> missingGemeentes = new HashSet<>(gemeenteCodes);
  306.       for (int i = 0; i < urls.length; i++) {
  307.         BAG2LoaderUtils.BAGExtractSelectie bagExtractLevering =
  308.             BAG2LoaderUtils.getBAGExtractSelectieFromZip(urls[i]);

  309.         if (!bagExtractLevering.isGebiedNLD()
  310.             && !bagExtractLevering.isStand()
  311.             && bagExtractLevering.getMutatiesFrom().equals(currentTechnischeDatum)) {

  312.           for (String gemeenteCode : bagExtractLevering.getGemeenteCodes()) {
  313.             if (gemeenteCodes.contains(gemeenteCode)) {
  314.               applicableMutatieIndexes.add(i);
  315.               missingGemeentes.remove(gemeenteCode);
  316.             }
  317.           }
  318.         }
  319.       }

  320.       if (applicableMutatieIndexes.isEmpty()) {
  321.         log.info(
  322.             String.format(
  323.                 "Geen nieuw toe te passen gemeentemutatiebestanden gevonden voor huidige stand technische datum %s, klaar",
  324.                 currentTechnischeDatum));
  325.         break;
  326.       }

  327.       // Check whether applicable mutaties are available for all gemeentecodes because they
  328.       // need to be processed
  329.       // at the same time to ignore duplicates
  330.       if (!missingGemeentes.isEmpty()) {
  331.         throw new IllegalArgumentException(
  332.             String.format(
  333.                 "Kan geen gemeente mutaties toepassen voor gemeentes %s vanaf stand technische datum %s, in opgegeven mutatiebestanden ontbreken gemeentecodes %s",
  334.                 gemeenteCodes, currentTechnischeDatum, missingGemeentes));
  335.       }

  336.       log.info(
  337.           String.format(
  338.               "Toepassen gemeentemutaties voor %d gemeentes vanaf stand technische datum %s...",
  339.               gemeenteCodes.size(), currentTechnischeDatum));

  340.       BAG2GMLMutatieGroepStream.BagInfo bagInfo = null;

  341.       loadOptions.setIgnoreDuplicates(gemeenteCodes.size() > 1);
  342.       for (int index : applicableMutatieIndexes) {
  343.         bagInfo =
  344.             loadBAG2ExtractFromURLorFile(
  345.                 db, loadOptions, dbOptions, progressReporter, urls[index], cookieManager);
  346.       }
  347.       currentTechnischeDatum =
  348.           new java.sql.Date(bagInfo.getStandTechnischeDatum().getTime()).toLocalDate();
  349.       updateMetadata(db, loadOptions, false, null, bagInfo.getStandTechnischeDatum());
  350.       db.getConnection().commit();
  351.       // Duplicates need only be checked for mutaties for a single from date, clear cache to
  352.       // reduce memory usage
  353.       clearDuplicatesCache();
  354.       log.info("Mutaties verwerkt, huidige stand technische datum: " + currentTechnischeDatum);

  355.     } while (true);
  356.     applyGeoFilter(db, loadOptions);
  357.   }

  358.   private void applyNLMutaties(
  359.       BAG2Database db,
  360.       BAG2DatabaseOptions dbOptions,
  361.       BAG2LoadOptions loadOptions,
  362.       BAG2ProgressReporter progressReporter,
  363.       String[] urls,
  364.       CookieManager cookieManager)
  365.       throws Exception {
  366.     LocalDate currentTechnischeDatum = db.getCurrentTechnischeDatum();
  367.     do {
  368.       String applicatieMutatieURL = null;

  369.       for (String url : urls) {
  370.         BAG2LoaderUtils.BAGExtractSelectie bagExtractSelectie =
  371.             BAG2LoaderUtils.getBAGExtractSelectieFromZip(url);

  372.         if (bagExtractSelectie.isGebiedNLD()
  373.             && !bagExtractSelectie.isStand()
  374.             && bagExtractSelectie.getMutatiesFrom().equals(currentTechnischeDatum)) {
  375.           applicatieMutatieURL = url;
  376.         }
  377.       }

  378.       if (applicatieMutatieURL == null) {
  379.         log.info(
  380.             String.format(
  381.                 "Geen nieuw toe te passen mutatiebestanden gevonden voor huidige stand technische datum %s, klaar",
  382.                 currentTechnischeDatum));
  383.         break;
  384.       }

  385.       log.info(
  386.           String.format(
  387.               "Toepassen mutaties vanaf stand technische datum %s...", currentTechnischeDatum));

  388.       BAG2GMLMutatieGroepStream.BagInfo bagInfo =
  389.           loadBAG2ExtractFromURLorFile(
  390.               db, loadOptions, dbOptions, progressReporter, applicatieMutatieURL, cookieManager);
  391.       currentTechnischeDatum =
  392.           new java.sql.Date(bagInfo.getStandTechnischeDatum().getTime()).toLocalDate();
  393.       updateMetadata(db, loadOptions, false, null, bagInfo.getStandTechnischeDatum());
  394.       db.getConnection().commit();
  395.       log.info("Mutaties verwerkt, huidige stand technische datum: " + currentTechnischeDatum);
  396.     } while (true);
  397.     applyGeoFilter(db, loadOptions);
  398.   }

  399.   private static final int SRID = 28992;

  400.   public void applyGeoFilter(BAG2Database db, BAG2LoadOptions loadOptions) throws Exception {

  401.     String filterMetadata;

  402.     if (loadOptions.getGeoFilter() != null) {
  403.       filterMetadata = loadOptions.getGeoFilter();
  404.       try {
  405.         new WKTReader().read(filterMetadata);
  406.       } catch (Exception e) {
  407.         log.error("Ongeldige WKT gespecificeerd voor geometrie-filter", e);
  408.         return;
  409.       }
  410.       db.setMetadataValue(FILTER_GEOMETRIE, filterMetadata);
  411.     } else {
  412.       filterMetadata = db.getMetadata(FILTER_GEOMETRIE);
  413.     }

  414.     if (filterMetadata == null) {
  415.       return;
  416.     }
  417.     Geometry geometry;
  418.     try {
  419.       geometry = new WKTReader().read(filterMetadata);
  420.       geometry.setSRID(SRID);
  421.     } catch (Exception e) {
  422.       log.error(
  423.           String.format(
  424.               "Geometrie-filter niet toegepast, fout bij parsen %s als WKT, waarde: \"%s\"",
  425.               FILTER_GEOMETRIE, filterMetadata),
  426.           e);
  427.       return;
  428.     }
  429.     log.info("Verwijderen records die niet binnen geometrie-filter vallen...");

  430.     BAG2SchemaMapper schemaMapper = BAG2SchemaMapper.getInstance();
  431.     BAG2Schema bag2Schema = BAG2Schema.getInstance();

  432.     db.getConnection().setAutoCommit(false);

  433.     String[] objectTypes =
  434.         new String[] {"Ligplaats", "Standplaats", "Pand", "Verblijfsobject", "Woonplaats"};

  435.     for (String objectTypeName : objectTypes) {
  436.       ObjectType objectType = bag2Schema.getObjectTypeByName(objectTypeName);
  437.       String tableName = schemaMapper.getTableNameForObjectType(objectType, "");
  438.       String geoCondition =
  439.           db.getDialect() instanceof OracleDialect
  440.               ? "st_intersects(?, geometrie) = 'FALSE'"
  441.               : "not st_intersects(geometrie, ?)"; // Also works for Oracle 23c, not < 23c
  442.       String sql =
  443.           String.format(
  444.               """
  445.                 delete from %s
  446.                 where identificatie in (
  447.                   select identificatie from %s
  448.                   where eindgeldigheid is null and tijdstipinactief is null
  449.                   and %s
  450.                 )""",
  451.               tableName, tableName, geoCondition);
  452.       try (QueryBatch queryBatch =
  453.           new GeometryHandlingPreparedStatementBatch(
  454.               db.getConnection(), sql, 1, db.getDialect(), new Boolean[] {true}, false)) {
  455.         log.info("Verwijderen van records voor " + objectType.getName());
  456.         queryBatch.addBatch(new Object[] {geometry});
  457.       }
  458.     }

  459.     // Don't use getObjectTypeByName(), because heeftAlsNevenadres join tables need to be directly
  460.     // in sql literal anyway
  461.     String sql =
  462.         """
  463.         delete from nummeraanduiding n
  464.         where not exists (select 1 from verblijfsobject v where v.heeftalshoofdadres = n.identificatie)
  465.         and not exists (select 1 from verblijfsobject_nevenadres vn where vn.heeftalsnevenadres = n.identificatie)
  466.         and not exists (select 1 from ligplaats l where l.heeftalshoofdadres = n.identificatie)
  467.         and not exists (select 1 from ligplaats_nevenadres ln where ln.heeftalsnevenadres = n.identificatie)
  468.         and not exists (select 1 from standplaats s where s.heeftalshoofdadres = n.identificatie)
  469.         and not exists (select 1 from standplaats_nevenadres sn where sn.heeftalsnevenadres = n.identificatie)
  470.         """;
  471.     try (PreparedStatement ps = db.getConnection().prepareStatement(sql)) {
  472.       log.info("Verwijderen niet-gerefereerde nummeraanduiding-records");
  473.       ps.executeUpdate();
  474.     }
  475.     sql =
  476.         """
  477.         delete from openbareruimte o where not exists (select 1 from nummeraanduiding where ligtaan = o.identificatie)
  478.         """;
  479.     try (PreparedStatement ps = db.getConnection().prepareStatement(sql)) {
  480.       log.info("Verwijderen niet-gerefereerde openbareruimte-records");
  481.       ps.executeUpdate();
  482.     }
  483.     db.getConnection().commit();
  484.     log.info("Klaar met verwijderen records buiten geometrie-filter");
  485.   }

  486.   private void createKeysAndIndexes(
  487.       BAG2Database db,
  488.       BAG2LoadOptions loadOptions,
  489.       BAG2DatabaseOptions databaseOptions,
  490.       BAG2ProgressReporter progressReporter)
  491.       throws Exception {
  492.     BAG2ObjectTableWriter writer = db.createObjectTableWriter(loadOptions, databaseOptions);
  493.     writer.setProgressUpdater(progressReporter);
  494.     for (BAG2ObjectType objectType : objectTypesWithSchemaCreated) {
  495.       writer.createKeys(objectType); // BAG2 writer is always a single ObjectType unlike BGT
  496.       writer.createIndexes(objectType);
  497.     }
  498.   }

  499.   private BAG2GMLMutatieGroepStream.BagInfo loadBAG2ExtractFromURLorFile(
  500.       BAG2Database db,
  501.       BAG2LoadOptions loadOptions,
  502.       BAG2DatabaseOptions dbOptions,
  503.       BAG2ProgressReporter progressReporter,
  504.       String url)
  505.       throws Exception {
  506.     return loadBAG2ExtractFromURLorFile(db, loadOptions, dbOptions, progressReporter, url, null);
  507.   }

  508.   private BAG2GMLMutatieGroepStream.BagInfo loadBAG2ExtractFromURLorFile(
  509.       BAG2Database db,
  510.       BAG2LoadOptions loadOptions,
  511.       BAG2DatabaseOptions dbOptions,
  512.       BAG2ProgressReporter progressReporter,
  513.       String url,
  514.       CookieManager cookieManager)
  515.       throws Exception {
  516.     HttpClientWrapper<HttpRequest.Builder, HttpResponse<InputStream>> httpClientWrapper =
  517.         cookieManager == null
  518.             ? new Java11HttpClientWrapper()
  519.             : new Java11HttpClientWrapper(HttpClient.newBuilder().cookieHandler(cookieManager));

  520.     if (url.startsWith("http://") || url.startsWith("https://")) {
  521.       try (InputStream in =
  522.           new ResumingInputStream(
  523.               new HttpStartRangeInputStreamProvider(URI.create(url), httpClientWrapper))) {
  524.         return loadBAG2ExtractFromStream(db, loadOptions, dbOptions, progressReporter, url, in);
  525.       }
  526.     }
  527.     if (url.endsWith(".zip")) {
  528.       try (InputStream in = new FileInputStream(url)) {
  529.         return loadBAG2ExtractFromStream(db, loadOptions, dbOptions, progressReporter, url, in);
  530.       }
  531.     }

  532.     throw new IllegalArgumentException(getMessageFormattedString("load.invalid_file", url));
  533.   }

  534.   private BAG2GMLMutatieGroepStream.BagInfo loadBAG2ExtractFromStream(
  535.       BAG2Database db,
  536.       BAG2LoadOptions loadOptions,
  537.       BAG2DatabaseOptions dbOptions,
  538.       BAG2ProgressReporter progressReporter,
  539.       String name,
  540.       InputStream input)
  541.       throws Exception {
  542.     BAG2GMLMutatieGroepStream.BagInfo bagInfo = null;
  543.     Set<String> gemeenteIdentificaties = new HashSet<>();
  544.     try (ZipArchiveInputStream zip = new ZipArchiveInputStream(input)) {
  545.       ZipArchiveEntry entry = zip.getNextZipEntry();
  546.       while (entry != null) {
  547.         if (entry.getName().matches("[0-9]{4}(STA|VBO|OPR|NUM|LIG|PND|WPL).*\\.xml")) {
  548.           // Load extracted zipfile
  549.           bagInfo =
  550.               loadXmlEntriesFromZipFile(
  551.                   db, loadOptions, dbOptions, progressReporter, name, zip, entry);
  552.           break;
  553.         }

  554.         if (entry.getName().matches("[0-9]{4}GEM[0-9]{8}\\.zip")) {
  555.           bagInfo =
  556.               loadBAG2ExtractFromStream(
  557.                   db,
  558.                   loadOptions,
  559.                   dbOptions,
  560.                   progressReporter,
  561.                   name,
  562.                   CloseShieldInputStream.wrap(zip));
  563.         }

  564.         // Process single and double-nested ZIP files

  565.         if (entry.getName().matches("[0-9]{4}(STA|VBO|OPR|NUM|LIG|PND|WPL).*\\.zip")
  566.             || entry.getName().matches("[0-9]{4}MUT[0-9]{8}-[0-9]{8}\\.zip")) {
  567.           ZipArchiveInputStream nestedZip = new ZipArchiveInputStream(zip);
  568.           bagInfo =
  569.               loadXmlEntriesFromZipFile(
  570.                   db,
  571.                   loadOptions,
  572.                   dbOptions,
  573.                   progressReporter,
  574.                   entry.getName(),
  575.                   nestedZip,
  576.                   nestedZip.getNextZipEntry());
  577.         }

  578.         if (entry.getName().matches("[0-9]{4}Inactief.*\\.zip")) {
  579.           ZipArchiveInputStream nestedZip = new ZipArchiveInputStream(zip);
  580.           ZipArchiveEntry nestedEntry = nestedZip.getNextZipEntry();
  581.           while (nestedEntry != null) {
  582.             if (nestedEntry.getName().matches("[0-9]{4}IA.*\\.zip")) {
  583.               ZipArchiveInputStream moreNestedZip = new ZipArchiveInputStream(nestedZip);
  584.               bagInfo =
  585.                   loadXmlEntriesFromZipFile(
  586.                       db,
  587.                       loadOptions,
  588.                       dbOptions,
  589.                       progressReporter,
  590.                       nestedEntry.getName(),
  591.                       moreNestedZip,
  592.                       moreNestedZip.getNextZipEntry());
  593.             }
  594.             nestedEntry = nestedZip.getNextZipEntry();
  595.           }
  596.         }

  597.         if (bagInfo != null) {
  598.           gemeenteIdentificaties.addAll(bagInfo.getGemeenteIdentificaties());
  599.         }

  600.         try {
  601.           entry = zip.getNextZipEntry();
  602.         } catch (IOException e) {
  603.           // Reading the ZIP from HTTP may give this error, but it is a normal end...
  604.           if ("Truncated ZIP file".equals(e.getMessage())) {
  605.             break;
  606.           }
  607.         }
  608.       }
  609.     }
  610.     if (bagInfo != null) {
  611.       // Update BagInfo with all seen gemeenteIdentificaties in case we processed a ZIP with
  612.       // multiple gemeentestanden
  613.       bagInfo.setGemeenteIdentificaties(gemeenteIdentificaties);
  614.     }
  615.     return bagInfo;
  616.   }

  617.   private static BAG2ObjectType getObjectTypeFromFilename(String filename) {
  618.     Matcher m =
  619.         Pattern.compile(".*[0-9]{4}(IA)?(MUT|STA|VBO|OPR|NUM|LIG|PND|WPL).*\\.(xml|zip)")
  620.             .matcher(filename);
  621.     if (!m.matches()) {
  622.       throw new IllegalArgumentException("Invalid BAG2 filename: " + filename);
  623.     }
  624.     String objectTypeName = null;
  625.     switch (m.group(2)) {
  626.       case "MUT":
  627.         break;
  628.       case "STA":
  629.         objectTypeName = "Standplaats";
  630.         break;
  631.       case "OPR":
  632.         objectTypeName = "OpenbareRuimte";
  633.         break;
  634.       case "VBO":
  635.         objectTypeName = "Verblijfsobject";
  636.         break;
  637.       case "NUM":
  638.         objectTypeName = "Nummeraanduiding";
  639.         break;
  640.       case "LIG":
  641.         objectTypeName = "Ligplaats";
  642.         break;
  643.       case "PND":
  644.         objectTypeName = "Pand";
  645.         break;
  646.       case "WPL":
  647.         objectTypeName = "Woonplaats";
  648.         break;
  649.     }
  650.     if (objectTypeName == null) {
  651.       return null;
  652.     } else {
  653.       return BAG2Schema.getInstance().getObjectTypeByName(objectTypeName);
  654.     }
  655.   }

  656.   private void updateMetadata(
  657.       BAG2Database db,
  658.       BAG2LoadOptions loadOptions,
  659.       boolean stand,
  660.       Set<String> gemeenteIdentificaties,
  661.       Date standTechnischeDatum)
  662.       throws Exception {
  663.     // Check if metadata table already exists. For PostgreSQL we can use the metadata table in
  664.     // the public schema
  665.     if (!db.getDialect().tableExists(db.getConnection(), METADATA_TABLE_NAME)) {
  666.       // Create a new metadata table, for Oracle as BAG is in separate schema, for PostgreSQL
  667.       // if loading BAG
  668.       // into a non-brmo RSGB database
  669.       db.createMetadataTable(loadOptions);
  670.     }

  671.     db.setMetadataValue(
  672.         BAG2SchemaMapper.Metadata.LOADER_VERSION, BAG2LoaderUtils.getLoaderVersion());
  673.     SimpleDateFormat df = new SimpleDateFormat("yyyy-MM-dd");
  674.     if (stand) {
  675.       db.setMetadataValue(
  676.           STAND_LOAD_TIME, new SimpleDateFormat("yyyy-MM-dd HH:mm:ss").format(new Date()));
  677.       db.setMetadataValue(STAND_LOAD_TECHNISCHE_DATUM, df.format(standTechnischeDatum));
  678.       db.setMetadataValue(GEMEENTE_CODES, String.join(",", gemeenteIdentificaties));
  679.     }
  680.     db.setMetadataValue(CURRENT_TECHNISCHE_DATUM, df.format(standTechnischeDatum));
  681.   }

  682.   private void clearDuplicatesCache() {
  683.     keysPerObjectType = new HashMap<>();
  684.   }

  685.   private BAG2GMLMutatieGroepStream.BagInfo loadXmlEntriesFromZipFile(
  686.       BAG2Database db,
  687.       BAG2LoadOptions loadOptions,
  688.       BAG2DatabaseOptions databaseOptions,
  689.       BAG2ProgressReporter progressReporter,
  690.       String name,
  691.       ZipArchiveInputStream zip,
  692.       ZipArchiveEntry entry)
  693.       throws Exception {
  694.     BAG2ObjectType objectType = getObjectTypeFromFilename(name);
  695.     // objectType is null for mutaties, which contain mixed object types instead of a single
  696.     // object type with stand
  697.     boolean schemaCreated = objectType == null || objectTypesWithSchemaCreated.contains(objectType);
  698.     BAG2ObjectTableWriter writer = db.createObjectTableWriter(loadOptions, databaseOptions);
  699.     writer.setProgressUpdater(progressReporter);
  700.     writer.setCreateSchema(!schemaCreated);
  701.     writer.setCreateKeysAndIndexes(false);
  702.     writer.setKeysPerObjectType(keysPerObjectType);
  703.     writer.start(); // sets InitialLoad to true
  704.     writer
  705.         .getProgress()
  706.         .setInitialLoad(!schemaCreated); // For a COPY in transaction, table must be created or
  707.     // truncated in it
  708.     if (objectType == null) {
  709.       // When processing mutaties, set batch size to 1 so all mutaties are processed
  710.       // sequentially and can not
  711.       // conflict with deleting and inserting of old/new versions
  712.       writer.setBatchSize(1);
  713.       // Disable multithreading so deletion of previous versions and new inserts are processed
  714.       // sequentially
  715.       writer.setMultithreading(false);
  716.     }
  717.     progressReporter.startNewFile(name);
  718.     try {
  719.       while (entry != null) {
  720.         progressReporter.startNextSplitFile(entry.getName());
  721.         writer.write(CloseShieldInputStream.wrap(zip));
  722.         if (loadOptions.getMaxObjects() != null
  723.             && writer.getProgress().getObjectCount() == loadOptions.getMaxObjects()) {
  724.           break;
  725.         }
  726.         entry = zip.getNextZipEntry();
  727.       }
  728.       writer.complete();

  729.       if (writer.getProgress().getObjectCount() > 0 && objectType != null) {
  730.         objectTypesWithSchemaCreated.add(objectType);
  731.       }

  732.       return writer.getProgress().getMutatieInfo();
  733.     } catch (Exception e) {
  734.       writer.abortWorkerThread();
  735.       throw e;
  736.     }
  737.   }
  738. }