From d01d493a054dab5c95e946521ebfd6a4d1929122 Mon Sep 17 00:00:00 2001 From: Samier Merchant Date: Wed, 12 Feb 2025 20:54:01 -0500 Subject: [PATCH 1/9] Update ogrct.cpp to remove shared shared proj context (m_psLastContext), which can lead to scenarios where one thread destroys the context while another is still using it Undo https://github.com/OSGeo/gdal/commit/94ede75a44d62203bfb4b7d154d94427cacb1230, which causes segfaults when using gdal in a multi-threaded environment such as a thread worker pool. It might be the case that one thread "destroys" the context (m_psLastContext) while another thread is still using it, leading to a segfault. As you can see with the following line: m_psLastContext = OSRGetProjTLSContext(); --- ogr/ogrct.cpp | 16 ++-------------- 1 file changed, 2 insertions(+), 14 deletions(-) diff --git a/ogr/ogrct.cpp b/ogr/ogrct.cpp index ae93f7163579..d1310fa89dfd 100644 --- a/ogr/ogrct.cpp +++ b/ogr/ogrct.cpp @@ -21,7 +21,6 @@ #include #include #include -#include #include "cpl_conv.h" #include "cpl_error.h" @@ -750,9 +749,6 @@ class OGRProjCT : public OGRCoordinateTransformation double dfThreshold = 0.0; - PJ_CONTEXT *m_psLastContext = nullptr; - std::thread::id m_nLastContextThreadId{}; - PjPtr m_pj{}; bool m_bReversePj = false; @@ -1265,8 +1261,7 @@ OGRProjCT::OGRProjCT(const OGRProjCT &other) m_osTargetSRS(other.m_osTargetSRS), bWebMercatorToWGS84LongLat(other.bWebMercatorToWGS84LongLat), nErrorCount(other.nErrorCount), dfThreshold(other.dfThreshold), - m_psLastContext(nullptr), - m_nLastContextThreadId(std::this_thread::get_id()), m_pj(other.m_pj), + m_pj(other.m_pj), m_bReversePj(other.m_bReversePj), m_bEmitErrors(other.m_bEmitErrors), bNoTransform(other.bNoTransform), m_eStrategy(other.m_eStrategy), m_oTransformations(other.m_oTransformations), @@ -2520,14 +2515,7 @@ int OGRProjCT::TransformWithErrorCodes(size_t nCount, double *x, double *y, /* Select dynamically the best transformation for the data, if */ /* needed. */ /* -------------------------------------------------------------------- */ - PJ_CONTEXT *ctx = m_psLastContext; - const auto nThisThreadId = std::this_thread::get_id(); - if (!ctx || nThisThreadId != m_nLastContextThreadId) - { - m_nLastContextThreadId = nThisThreadId; - m_psLastContext = OSRGetProjTLSContext(); - ctx = m_psLastContext; - } + auto ctx = OSRGetProjTLSContext(); PJ *pj = m_pj; if (!bTransformDone && !pj) From f4ce0348a7749618e5f5d6e8f1652e1baa17fcf0 Mon Sep 17 00:00:00 2001 From: Alan Thomas Date: Sat, 15 Feb 2025 13:59:59 +1100 Subject: [PATCH 2/9] DXF: Don't hide block entities on layer 0 when that layer is frozen --- autotest/ogr/ogr_dxf.py | 33 ++++++++++++++++++++++++-- ogr/ogrsf_frmts/dxf/ogrdxf_feature.cpp | 18 +++++++------- 2 files changed, 40 insertions(+), 11 deletions(-) diff --git a/autotest/ogr/ogr_dxf.py b/autotest/ogr/ogr_dxf.py index b07e71d3d5c3..cc61c92f8d9c 100644 --- a/autotest/ogr/ogr_dxf.py +++ b/autotest/ogr/ogr_dxf.py @@ -3881,7 +3881,7 @@ def test_ogr_dxf_53(): # Test frozen and off layers -def test_ogr_dxf_54(): +def test_ogr_dxf_54(tmp_vsimem): with gdal.config_option("DXF_MERGE_BLOCK_GEOMETRIES", "FALSE"): ds = ogr.Open("data/dxf/frozen-off.dxf") @@ -3897,7 +3897,36 @@ def test_ogr_dxf_54(): ) if isFeatureVisible == (h == "h"): f.DumpReadable() - pytest.fail("Wrong visibility on feature %d" % number) + pytest.fail( + "Wrong visibility on feature %d (testing with layer 0 thawed)" % number + ) + + # Rewrite the test file, this time with layer 0 set as frozen + with open("data/dxf/frozen-off.dxf", "r") as file: + gdal.FileFromMemBuffer( + tmp_vsimem / "frozen-off-with-layer0-frozen.dxf", + file.read().replace( + "0\nLAYER\n 2\n0\n 70\n 0", "0\nLAYER\n 2\n0\n 70\n 1" + ), + ) + + with gdal.config_option("DXF_MERGE_BLOCK_GEOMETRIES", "FALSE"): + ds = ogr.Open( + tmp_vsimem / "frozen-off-with-layer0-frozen.dxf", + ) + lyr = ds.GetLayer(0) + + # Repeat test - outcome should be the same + for number, h in enumerate(featureVisibility): + f = lyr.GetNextFeature() + isFeatureVisible = ( + "#000000)" in f.GetStyleString() or "#ff0000)" in f.GetStyleString() + ) + if isFeatureVisible == (h == "h"): + f.DumpReadable() + pytest.fail( + "Wrong visibility on feature %d (testing with layer 0 frozen)" % number + ) ############################################################################### diff --git a/ogr/ogrsf_frmts/dxf/ogrdxf_feature.cpp b/ogr/ogrsf_frmts/dxf/ogrdxf_feature.cpp index 8bb92b3aab50..36e395127f4e 100644 --- a/ogr/ogrsf_frmts/dxf/ogrdxf_feature.cpp +++ b/ogr/ogrsf_frmts/dxf/ogrdxf_feature.cpp @@ -146,9 +146,9 @@ OGRDXFFeature::GetColor(OGRDXFDataSource *const poDS, (poBlockFeature && poBlockFeature->oStyleProperties.count("Hidden") > 0)) { - // Hidden objects should never be shown no matter what happens, - // so they can be treated as if they are on a frozen layer - iHidden = 2; + // Hidden objects should never be shown no matter what happens + iHidden = 1; + oStyleProperties["Hidden"] = "1"; } else { @@ -166,13 +166,13 @@ OGRDXFFeature::GetColor(OGRDXFDataSource *const poDS, if (pszBlockHidden && atoi(pszBlockHidden) == 2) iHidden = 2; } - } - // If this feature is on a frozen layer, make the object totally - // hidden so it won't reappear if we regenerate the style string again - // during block insertion - if (iHidden == 2) - oStyleProperties["Hidden"] = "1"; + // If this feature is on a frozen layer (other than layer 0), make the + // object totally hidden so it won't reappear if we regenerate the style + // string again during block insertion + if (iHidden == 2 && !EQUAL(GetFieldAsString("Layer"), "0")) + oStyleProperties["Hidden"] = "1"; + } // Helpful constants const int C_BYLAYER = 256; From 504f825c9a6832d9074c472491cac71c9f687d3a Mon Sep 17 00:00:00 2001 From: Even Rouault Date: Mon, 17 Feb 2025 19:33:59 +0100 Subject: [PATCH 3/9] Formatting fix --- ogr/ogrct.cpp | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/ogr/ogrct.cpp b/ogr/ogrct.cpp index d1310fa89dfd..f04c993677c2 100644 --- a/ogr/ogrct.cpp +++ b/ogr/ogrct.cpp @@ -1261,9 +1261,9 @@ OGRProjCT::OGRProjCT(const OGRProjCT &other) m_osTargetSRS(other.m_osTargetSRS), bWebMercatorToWGS84LongLat(other.bWebMercatorToWGS84LongLat), nErrorCount(other.nErrorCount), dfThreshold(other.dfThreshold), - m_pj(other.m_pj), - m_bReversePj(other.m_bReversePj), m_bEmitErrors(other.m_bEmitErrors), - bNoTransform(other.bNoTransform), m_eStrategy(other.m_eStrategy), + m_pj(other.m_pj), m_bReversePj(other.m_bReversePj), + m_bEmitErrors(other.m_bEmitErrors), bNoTransform(other.bNoTransform), + m_eStrategy(other.m_eStrategy), m_oTransformations(other.m_oTransformations), m_iCurTransformation(other.m_iCurTransformation), m_options(other.m_options) From b026b4c0e17edf511c4173f929718cde33376fb5 Mon Sep 17 00:00:00 2001 From: Alessandro Pasotti Date: Tue, 18 Feb 2025 16:38:45 +0100 Subject: [PATCH 4/9] CPLTurnFailureIntoWarning backuper (#11859) Small utility class to set TurnFailureIntoWarning and restore it when deleted. Fix #11831 --- alg/gdaltransformer.cpp | 31 +++++++++++++------------ doc/Makefile | 4 ++-- frmts/gtiff/gtiffdataset_read.cpp | 15 +++++++----- frmts/safe/safedataset.cpp | 13 +++++++---- gcore/gdal_misc.cpp | 6 ++--- ogr/ogrsf_frmts/adbc/ogradbcdataset.cpp | 6 ++--- port/cpl_error.h | 17 ++++++++++++++ 7 files changed, 56 insertions(+), 36 deletions(-) diff --git a/alg/gdaltransformer.cpp b/alg/gdaltransformer.cpp index 08c059d9149f..cb180d8ba464 100644 --- a/alg/gdaltransformer.cpp +++ b/alg/gdaltransformer.cpp @@ -524,11 +524,11 @@ CPLErr CPL_STDCALL GDALSuggestedWarpOutput2(GDALDatasetH hSrcDS, /* -------------------------------------------------------------------- */ /* Transform them to the output coordinate system. */ /* -------------------------------------------------------------------- */ - CPLTurnFailureIntoWarning(true); - pfnTransformer(pTransformArg, FALSE, nSamplePoints, padfX, padfY, padfZ, - pabSuccess); - CPLTurnFailureIntoWarning(false); - + { + CPLTurnFailureIntoWarningBackuper oErrorsToWarnings{}; + pfnTransformer(pTransformArg, FALSE, nSamplePoints, padfX, padfY, padfZ, + pabSuccess); + } constexpr int SIGN_FINAL_UNINIT = -2; constexpr int SIGN_FINAL_INVALID = 0; int iSignDiscontinuity = SIGN_FINAL_UNINIT; @@ -588,7 +588,7 @@ CPLErr CPL_STDCALL GDALSuggestedWarpOutput2(GDALDatasetH hSrcDS, double ayTemp[2] = {padfY[i], padfY[i]}; double azTemp[2] = {padfZ[i], padfZ[i]}; int abSuccess[2] = {FALSE, FALSE}; - CPLTurnFailureIntoWarning(true); + CPLTurnFailureIntoWarningBackuper oErrorsToWarnings{}; if (pfnTransformer(pTransformArg, TRUE, 2, axTemp, ayTemp, azTemp, abSuccess) && fabs(axTemp[0] - axTemp[1]) < 1e-8 && @@ -596,7 +596,6 @@ CPLErr CPL_STDCALL GDALSuggestedWarpOutput2(GDALDatasetH hSrcDS, { padfX[i] = iSignDiscontinuity * 180.0; } - CPLTurnFailureIntoWarning(false); } } } @@ -615,10 +614,11 @@ CPLErr CPL_STDCALL GDALSuggestedWarpOutput2(GDALDatasetH hSrcDS, memcpy(padfXRevert, padfX, nSamplePoints * sizeof(double)); memcpy(padfYRevert, padfY, nSamplePoints * sizeof(double)); memcpy(padfZRevert, padfZ, nSamplePoints * sizeof(double)); - CPLTurnFailureIntoWarning(true); - pfnTransformer(pTransformArg, TRUE, nSamplePoints, padfXRevert, - padfYRevert, padfZRevert, pabSuccess); - CPLTurnFailureIntoWarning(false); + { + CPLTurnFailureIntoWarningBackuper oErrorsToWarnings{}; + pfnTransformer(pTransformArg, TRUE, nSamplePoints, padfXRevert, + padfYRevert, padfZRevert, pabSuccess); + } for (int i = 0; nFailedCount == 0 && i < nSamplePoints; i++) { @@ -693,10 +693,11 @@ CPLErr CPL_STDCALL GDALSuggestedWarpOutput2(GDALDatasetH hSrcDS, CPLAssert(nSamplePoints == nSampleMax); - CPLTurnFailureIntoWarning(true); - pfnTransformer(pTransformArg, FALSE, nSamplePoints, padfX, padfY, padfZ, - pabSuccess); - CPLTurnFailureIntoWarning(false); + { + CPLTurnFailureIntoWarningBackuper oErrorsToWarnings{}; + pfnTransformer(pTransformArg, FALSE, nSamplePoints, padfX, padfY, + padfZ, pabSuccess); + } } /* -------------------------------------------------------------------- */ diff --git a/doc/Makefile b/doc/Makefile index aa59f735c2e0..be1b5e0e353a 100644 --- a/doc/Makefile +++ b/doc/Makefile @@ -29,7 +29,7 @@ doxygen: doxygen_check_warnings: @echo "Checking that Doxygen runs without warnings..." @$(MAKE) -B $(BUILDDIR)/.doxygen_up_to_date > /tmp/doxygen_gdal_log.txt 2>&1 - @if grep -i warning /tmp/doxygen_gdal_log.txt; then \ + @if grep "warning:" /tmp/doxygen_gdal_log.txt; then \ echo "Doxygen warnings found!"; \ echo "---------"; \ echo "Full log:"; \ @@ -39,7 +39,7 @@ doxygen_check_warnings: echo "--------------------"; \ echo "Extract of warnings:"; \ echo "--------------------"; \ - grep -i warning /tmp/doxygen_gdal_log.txt; \ + grep "warning:" /tmp/doxygen_gdal_log.txt; \ echo "-----------------------"; \ echo "Doxygen warnings found!"; \ /bin/false; \ diff --git a/frmts/gtiff/gtiffdataset_read.cpp b/frmts/gtiff/gtiffdataset_read.cpp index 21829c59d540..13c4a30f8e57 100644 --- a/frmts/gtiff/gtiffdataset_read.cpp +++ b/frmts/gtiff/gtiffdataset_read.cpp @@ -7123,12 +7123,15 @@ void *GTiffDataset::CacheMultiRange(int nXOff, int nYOff, int nXSize, // as this method is an optimization, and if it fails, // tile-by-tile data acquisition will be done, so we can // temporary turn failures into warnings. - CPLTurnFailureIntoWarning(true); - const bool ok = - VSIFReadMultiRangeL(static_cast(anSizes.size()), - &apData[0], &anOffsets[0], &anSizes[0], - fp) == 0; - CPLTurnFailureIntoWarning(false); + bool ok; + { + CPLTurnFailureIntoWarningBackuper + oFailureToWarninBackuper{}; + ok = VSIFReadMultiRangeL(static_cast(anSizes.size()), + &apData[0], &anOffsets[0], + &anSizes[0], fp) == 0; + } + if (ok) { if (!oMapStrileToOffsetByteCount.empty() && diff --git a/frmts/safe/safedataset.cpp b/frmts/safe/safedataset.cpp index a0c9ad98b1b0..640fa07ecd76 100644 --- a/frmts/safe/safedataset.cpp +++ b/frmts/safe/safedataset.cpp @@ -1297,11 +1297,14 @@ GDALDataset *SAFEDataset::Open(GDALOpenInfo *poOpenInfo) /* Try and open the file. */ /* -------------------------------------------------------------------- */ - CPLTurnFailureIntoWarning(true); - auto poBandFile = std::unique_ptr( - GDALDataset::Open(osFullFilename.c_str(), - GDAL_OF_RASTER | GDAL_OF_VERBOSE_ERROR)); - CPLTurnFailureIntoWarning(false); + std::unique_ptr poBandFile; + { + CPLTurnFailureIntoWarningBackuper oErrorsToWarnings{}; + poBandFile = std::unique_ptr( + GDALDataset::Open(osFullFilename.c_str(), + GDAL_OF_RASTER | GDAL_OF_VERBOSE_ERROR)); + } + if (poBandFile == nullptr) { // NOP diff --git a/gcore/gdal_misc.cpp b/gcore/gdal_misc.cpp index 98353426cebe..5159ccc90130 100644 --- a/gcore/gdal_misc.cpp +++ b/gcore/gdal_misc.cpp @@ -4518,14 +4518,13 @@ GDALDataset *GDALFindAssociatedAuxFile(const char *pszBasename, /* Avoid causing failure in opening of main file from SWIG bindings */ /* when auxiliary file cannot be opened (#3269) */ - CPLTurnFailureIntoWarning(TRUE); + CPLTurnFailureIntoWarningBackuper oErrorsToWarnings{}; if (poDependentDS != nullptr && poDependentDS->GetShared()) poODS = GDALDataset::FromHandle( GDALOpenShared(osAuxFilename, eAccess)); else poODS = GDALDataset::FromHandle(GDALOpen(osAuxFilename, eAccess)); - CPLTurnFailureIntoWarning(FALSE); } CPL_IGNORE_RET_VAL(VSIFCloseL(fp)); } @@ -4618,14 +4617,13 @@ GDALDataset *GDALFindAssociatedAuxFile(const char *pszBasename, /* Avoid causing failure in opening of main file from SWIG * bindings */ /* when auxiliary file cannot be opened (#3269) */ - CPLTurnFailureIntoWarning(TRUE); + CPLTurnFailureIntoWarningBackuper oErrorsToWarnings{}; if (poDependentDS != nullptr && poDependentDS->GetShared()) poODS = GDALDataset::FromHandle( GDALOpenShared(osAuxFilename, eAccess)); else poODS = GDALDataset::FromHandle( GDALOpen(osAuxFilename, eAccess)); - CPLTurnFailureIntoWarning(FALSE); } CPL_IGNORE_RET_VAL(VSIFCloseL(fp)); } diff --git a/ogr/ogrsf_frmts/adbc/ogradbcdataset.cpp b/ogr/ogrsf_frmts/adbc/ogradbcdataset.cpp index 68085054ba87..6b0ad96441ce 100644 --- a/ogr/ogrsf_frmts/adbc/ogradbcdataset.cpp +++ b/ogr/ogrsf_frmts/adbc/ogradbcdataset.cpp @@ -518,10 +518,9 @@ bool OGRADBCDataset::Open(const GDALOpenInfo *poOpenInfo) const std::string osStatement = CPLSPrintf("SELECT * FROM \"%s\"", OGRDuplicateCharacter(pszLayerName, '"').c_str()); - CPLTurnFailureIntoWarning(true); + CPLTurnFailureIntoWarningBackuper oErrorsToWarnings{}; auto poLayer = CreateLayer(osStatement.c_str(), pszLayerName, false); - CPLTurnFailureIntoWarning(false); if (poLayer) { m_apoLayers.emplace_back(std::move(poLayer)); @@ -550,11 +549,10 @@ bool OGRADBCDataset::Open(const GDALOpenInfo *poOpenInfo) OGRDuplicateCharacter(pszNamespace, '"').c_str(), OGRDuplicateCharacter(pszTableName, '"').c_str()); - CPLTurnFailureIntoWarning(true); + CPLTurnFailureIntoWarningBackuper oErrorsToWarnings{}; auto poLayer = CreateLayer( osStatement.c_str(), CPLSPrintf("%s.%s", pszNamespace, pszTableName), false); - CPLTurnFailureIntoWarning(false); if (poLayer) { m_apoLayers.emplace_back(std::move(poLayer)); diff --git a/port/cpl_error.h b/port/cpl_error.h index 63eaa6f3c37b..7eec97aab3c1 100644 --- a/port/cpl_error.h +++ b/port/cpl_error.h @@ -377,6 +377,23 @@ extern "C++" */ ~CPLErrorStateBackuper(); }; + + /** Class that turns errors into warning on construction, and + * restores the previous state on destruction. + */ + class CPL_DLL CPLTurnFailureIntoWarningBackuper + { + public: + CPLTurnFailureIntoWarningBackuper() + { + CPLTurnFailureIntoWarning(true); + } + + ~CPLTurnFailureIntoWarningBackuper() + { + CPLTurnFailureIntoWarning(false); + } + }; } #ifdef GDAL_COMPILATION From 61594858d3121b308edcf392b087880ec3bcf318 Mon Sep 17 00:00:00 2001 From: Dmitry Baryshnikov Date: Tue, 18 Feb 2025 19:18:18 +0300 Subject: [PATCH 5/9] NGW: Fix Coverity Scan defects in NGW driver (#11861) --- ogr/ogrsf_frmts/ngw/gdalngwdataset.cpp | 10 +-- ogr/ogrsf_frmts/ngw/ngw_api.cpp | 88 +++++++++++++------------- ogr/ogrsf_frmts/ngw/ogrngwlayer.cpp | 2 +- 3 files changed, 49 insertions(+), 51 deletions(-) diff --git a/ogr/ogrsf_frmts/ngw/gdalngwdataset.cpp b/ogr/ogrsf_frmts/ngw/gdalngwdataset.cpp index e958870b6454..e272b9f41a1a 100644 --- a/ogr/ogrsf_frmts/ngw/gdalngwdataset.cpp +++ b/ogr/ogrsf_frmts/ngw/gdalngwdataset.cpp @@ -93,7 +93,7 @@ static std::string GetStylesIdentifiers(const CPLJSONArray &aoStyles, int nDeep) { if (sOut.empty()) { - sOut = sId; + sOut = std::move(sId); } else { @@ -109,7 +109,7 @@ static std::string GetStylesIdentifiers(const CPLJSONArray &aoStyles, int nDeep) { if (sOut.empty()) { - sOut = sId; + sOut = std::move(sId); } else { @@ -1682,7 +1682,7 @@ bool OGRNGWDataset::DeleteFieldDomain(const std::string &name, /* * CreateNGWLookupTableJson() */ -static std::string CreateNGWLookupTableJson(OGRCodedFieldDomain *pDomain, +static std::string CreateNGWLookupTableJson(const OGRCodedFieldDomain *pDomain, GIntBig nResourceId) { CPLJSONObject oResourceJson; @@ -1801,7 +1801,7 @@ bool OGRNGWDataset::UpdateFieldDomain(std::unique_ptr &&domain, } auto osPayload = CreateNGWLookupTableJson( - dynamic_cast(domain.get()), + dynamic_cast(domain.get()), static_cast(std::stol(osResourceId))); if (!NGWAPI::UpdateResource(osUrl, osResourceId, osPayload, GetHeaders())) @@ -1851,7 +1851,7 @@ OGRNGWCodedFieldDomain OGRNGWDataset::GetDomainByID(GIntBig id) const */ GIntBig OGRNGWDataset::GetDomainIdByName(const std::string &osDomainName) const { - for (auto oDom : moDomains) + for (auto const &oDom : moDomains) { if (oDom.second.HasDomainName(osDomainName)) { diff --git a/ogr/ogrsf_frmts/ngw/ngw_api.cpp b/ogr/ogrsf_frmts/ngw/ngw_api.cpp index 891fa7f423ef..4f80e84c694a 100644 --- a/ogr/ogrsf_frmts/ngw/ngw_api.cpp +++ b/ogr/ogrsf_frmts/ngw/ngw_api.cpp @@ -20,13 +20,19 @@ namespace NGWAPI { -static bool ReportErrorToCPL(const std::string &osErrorMessage) +static std::string GetErrorMessage(const CPLJSONObject &oRoot, + const std::string &osErrorMessage) { - CPLError(CE_Failure, CPLE_AppDefined, - "NGW driver failed to fetch data with error: %s", - osErrorMessage.c_str()); - - return false; + if (oRoot.IsValid()) + { + std::string osErrorMessageInt = + oRoot.GetString("message", osErrorMessage); + if (!osErrorMessageInt.empty()) + { + return osErrorMessageInt; + } + } + return osErrorMessage; } bool CheckRequestResult(bool bResult, const CPLJSONObject &oRoot, @@ -34,26 +40,33 @@ bool CheckRequestResult(bool bResult, const CPLJSONObject &oRoot, { if (!bResult) { - if (oRoot.IsValid()) - { - std::string osErrorMessageInt = - oRoot.GetString("message", osErrorMessage); - if (!osErrorMessageInt.empty()) - { - return ReportErrorToCPL(osErrorMessageInt); - } - } - return ReportErrorToCPL(osErrorMessage); - } + auto osMsg = GetErrorMessage(oRoot, osErrorMessage); - if (!oRoot.IsValid()) - { - return ReportErrorToCPL(osErrorMessage); + CPLError(CE_Failure, CPLE_AppDefined, + "NGW driver failed to fetch data with error: %s", + osMsg.c_str()); + return false; } return true; } +static void ReportError(const GByte *pabyData, int nDataLen, + const std::string &osErrorMessage) +{ + CPLJSONDocument oResult; + if (oResult.LoadMemory(pabyData, nDataLen)) + { + CPLJSONObject oRoot = oResult.GetRoot(); + auto osMsg = GetErrorMessage(oRoot, osErrorMessage); + CPLError(CE_Failure, CPLE_AppDefined, "%s", osMsg.c_str()); + } + else + { + CPLError(CE_Failure, CPLE_AppDefined, "%s", osErrorMessage.c_str()); + } +} + bool CheckSupportedType(bool bIsRaster, const std::string &osType) { //TODO: Add "raster_mosaic", "tileset", "wfsserver_service" and "wmsserver_service" @@ -169,16 +182,6 @@ GetFeaturePageURL(const std::string &osUrl, const std::string &osResourceId, } } - if (bParamAdd) - { - osFeatureUrl += "&extensions=" + osExtensions; - } - else - { - osFeatureUrl += "?extensions=" + osExtensions; - bParamAdd = true; - } - if (IsGeometryIgnored) { if (bParamAdd) @@ -188,9 +191,19 @@ GetFeaturePageURL(const std::string &osUrl, const std::string &osResourceId, else { osFeatureUrl += "?geom=no"; + bParamAdd = true; } } + if (bParamAdd) + { + osFeatureUrl += "&extensions=" + osExtensions; + } + else + { + osFeatureUrl += "?extensions=" + osExtensions; + } + return osFeatureUrl; } @@ -281,21 +294,6 @@ Uri ParseUri(const std::string &osUrl) return stOut; } -static void ReportError(const GByte *pabyData, int nDataLen, - const std::string &osErrorMessage) -{ - CPLJSONDocument oResult; - if (oResult.LoadMemory(pabyData, nDataLen)) - { - CPLJSONObject oRoot = oResult.GetRoot(); - CheckRequestResult(false, oRoot, osErrorMessage); - } - else - { - CPLError(CE_Failure, CPLE_AppDefined, "%s", osErrorMessage.c_str()); - } -} - std::string CreateResource(const std::string &osUrl, const std::string &osPayload, const CPLStringList &aosHTTPOptions) diff --git a/ogr/ogrsf_frmts/ngw/ogrngwlayer.cpp b/ogr/ogrsf_frmts/ngw/ogrngwlayer.cpp index 8d8d287911f3..d20c6d6ba137 100644 --- a/ogr/ogrsf_frmts/ngw/ogrngwlayer.cpp +++ b/ogr/ogrsf_frmts/ngw/ogrngwlayer.cpp @@ -1310,7 +1310,7 @@ std::string OGRNGWLayer::CreateNGWResourceJson() { OGRFieldDefn *poFieldDefn = poFeatureDefn->GetFieldDefn(iField); CPLJSONObject oField; - auto sComment = poFieldDefn->GetComment(); + auto const &sComment = poFieldDefn->GetComment(); if (!sComment.empty()) { CPLJSONDocument oComment; From 027f3ca6487004004b1f6595a69a02fb3e858c16 Mon Sep 17 00:00:00 2001 From: Dan Baston Date: Tue, 18 Feb 2025 11:33:02 -0500 Subject: [PATCH 6/9] Add 'gdal raster calc' (#11850) --- apps/CMakeLists.txt | 1 + apps/gdalalg_raster.cpp | 2 + apps/gdalalg_raster_calc.cpp | 620 ++++++++++++++++++ apps/gdalalg_raster_calc.h | 54 ++ autotest/gdrivers/vrtderived.py | 11 +- .../utilities/test_gdalalg_raster_calc.py | 431 ++++++++++++ doc/source/programs/gdal_raster.rst | 2 + doc/source/programs/gdal_raster_calc.rst | 104 +++ doc/source/programs/index.rst | 2 + frmts/vrt/vrtexpression_muparser.cpp | 85 ++- frmts/vrt/vrtsources.cpp | 5 + gcore/gdalalgorithm.h | 2 +- swig/include/python/gdal_python.i | 4 + 13 files changed, 1310 insertions(+), 13 deletions(-) create mode 100644 apps/gdalalg_raster_calc.cpp create mode 100644 apps/gdalalg_raster_calc.h create mode 100755 autotest/utilities/test_gdalalg_raster_calc.py create mode 100644 doc/source/programs/gdal_raster_calc.rst diff --git a/apps/CMakeLists.txt b/apps/CMakeLists.txt index 530bd8eecf07..fefb8d67791d 100644 --- a/apps/CMakeLists.txt +++ b/apps/CMakeLists.txt @@ -12,6 +12,7 @@ add_library( gdalalg_pipeline.cpp gdalalg_raster.cpp gdalalg_raster_info.cpp + gdalalg_raster_calc.cpp gdalalg_raster_clip.cpp gdalalg_raster_convert.cpp gdalalg_raster_edit.cpp diff --git a/apps/gdalalg_raster.cpp b/apps/gdalalg_raster.cpp index ba68d40d55ca..769c9a9b4850 100644 --- a/apps/gdalalg_raster.cpp +++ b/apps/gdalalg_raster.cpp @@ -13,6 +13,7 @@ #include "gdalalgorithm.h" #include "gdalalg_raster_info.h" +#include "gdalalg_raster_calc.h" #include "gdalalg_raster_clip.h" #include "gdalalg_raster_convert.h" #include "gdalalg_raster_edit.h" @@ -41,6 +42,7 @@ class GDALRasterAlgorithm final : public GDALAlgorithm GDALRasterAlgorithm() : GDALAlgorithm(NAME, DESCRIPTION, HELP_URL) { RegisterSubAlgorithm(); + RegisterSubAlgorithm(); RegisterSubAlgorithm(); RegisterSubAlgorithm(); RegisterSubAlgorithm(); diff --git a/apps/gdalalg_raster_calc.cpp b/apps/gdalalg_raster_calc.cpp new file mode 100644 index 000000000000..8b7650eb8442 --- /dev/null +++ b/apps/gdalalg_raster_calc.cpp @@ -0,0 +1,620 @@ +/****************************************************************************** + * + * Project: GDAL + * Purpose: "gdal raster calc" subcommand + * Author: Daniel Baston + * + ****************************************************************************** + * Copyright (c) 2025, ISciences LLC + * + * SPDX-License-Identifier: MIT + ****************************************************************************/ + +#include "gdalalg_raster_calc.h" + +#include "../frmts/vrt/gdal_vrt.h" +#include "../frmts/vrt/vrtdataset.h" + +#include "gdal_priv.h" +#include "gdal_utils.h" + +#include +#include +#include + +//! @cond Doxygen_Suppress + +#ifndef _ +#define _(x) (x) +#endif + +struct GDALCalcOptions +{ + bool checkSRS{true}; + bool checkExtent{true}; +}; + +static bool MatchIsCompleteVariableNameWithNoIndex(const std::string &str, + size_t from, size_t to) +{ + if (to < str.size()) + { + // If the character after the end of the match is: + // * alphanumeric or _ : we've matched only part of a variable name + // * [ : we've matched a variable that already has an index + // * ( : we've matched a function name + if (std::isalnum(str[to]) || str[to] == '_' || str[to] == '[' || + str[to] == '(') + { + return false; + } + } + if (from > 0) + { + // If the character before the start of the match is alphanumeric or _, + // we've matched only part of a variable name. + if (std::isalnum(str[from - 1]) || str[from - 1] == '_') + { + return false; + } + } + + return true; +} + +/** + * Add a band subscript to all instances of a specified variable that + * do not already have such a subscript. For example, "X" would be + * replaced with "X[3]" but "X[1]" would be left untouched. + */ +static std::string SetBandIndices(const std::string &origExpression, + const std::string &variable, int band, + bool &expressionChanged) +{ + std::string expression = origExpression; + expressionChanged = false; + + std::string::size_type seekPos = 0; + auto pos = expression.find(variable, seekPos); + while (pos != std::string::npos) + { + auto end = pos + variable.size(); + + if (MatchIsCompleteVariableNameWithNoIndex(expression, pos, end)) + { + // No index specified for variable + expression = expression.substr(0, pos + variable.size()) + '[' + + std::to_string(band) + ']' + expression.substr(end); + expressionChanged = true; + } + + seekPos = end; + pos = expression.find(variable, seekPos); + } + + return expression; +} + +struct SourceProperties +{ + int nBands{0}; + int nX{0}; + int nY{0}; + std::array gt{}; + std::unique_ptr srs{ + nullptr}; +}; + +static std::optional +UpdateSourceProperties(SourceProperties &out, const std::string &dsn, + const GDALCalcOptions &options) +{ + SourceProperties source; + bool srsMismatch = false; + bool extentMismatch = false; + bool dimensionMismatch = false; + + { + std::unique_ptr ds( + GDALDataset::Open(dsn.c_str(), GDAL_OF_RASTER)); + + if (!ds) + { + CPLError(CE_Failure, CPLE_AppDefined, "Failed to open %s", + dsn.c_str()); + return std::nullopt; + } + + source.nBands = ds->GetRasterCount(); + source.nX = ds->GetRasterXSize(); + source.nY = ds->GetRasterYSize(); + + if (options.checkExtent) + { + ds->GetGeoTransform(source.gt.data()); + } + + if (options.checkSRS && out.srs) + { + const OGRSpatialReference *srs = ds->GetSpatialRef(); + srsMismatch = srs && !srs->IsSame(out.srs.get()); + } + } + + if (source.nX != out.nX || source.nY != out.nY) + { + dimensionMismatch = true; + } + + if (source.gt[0] != out.gt[0] || source.gt[2] != out.gt[2] || + source.gt[3] != out.gt[3] || source.gt[4] != out.gt[4]) + { + extentMismatch = true; + } + if (source.gt[1] != out.gt[1] || source.gt[5] != out.gt[5]) + { + // Resolutions are different. Are the extents the same? + double xmaxOut = out.gt[0] + out.nX * out.gt[1] + out.nY * out.gt[2]; + double yminOut = out.gt[3] + out.nX * out.gt[4] + out.nY * out.gt[5]; + + double xmax = + source.gt[0] + source.nX * source.gt[1] + source.nY * source.gt[2]; + double ymin = + source.gt[3] + source.nX * source.gt[4] + source.nY * source.gt[5]; + + // TODO use a tolerance here + if (xmax != xmaxOut || ymin != yminOut) + { + extentMismatch = true; + } + } + + if (options.checkExtent && extentMismatch) + { + CPLError(CE_Failure, CPLE_AppDefined, + "Input extents are inconsistent."); + return std::nullopt; + } + + if (!options.checkExtent && dimensionMismatch) + { + CPLError(CE_Failure, CPLE_AppDefined, + "Inputs do not have the same dimensions."); + return std::nullopt; + } + + // Choose the finest resolution + // TODO modify to use common resolution (https://github.com/OSGeo/gdal/issues/11497) + if (source.nX > out.nX) + { + out.nX = source.nX; + out.gt[1] = source.gt[1]; + } + if (source.nY > out.nY) + { + out.nY = source.nY; + out.gt[5] = source.gt[5]; + } + + if (srsMismatch) + { + CPLError(CE_Failure, CPLE_AppDefined, + "Input spatial reference systems are inconsistent."); + return std::nullopt; + } + + return source; +} + +/** Create XML nodes for one or more derived bands resulting from the evaluation + * of a single expression + * + * @param root VRTDataset node to which the band nodes should be added + * @param nXOut Number of columns in VRT dataset + * @param nYOut Number of rows in VRT dataset + * @param expression Expression for which band(s) should be added + * @param sources Mapping of source names to DSNs + * @param sourceProps Mapping of source names to properties + * @return true if the band(s) were added, false otherwise + */ +static bool +CreateDerivedBandXML(CPLXMLNode *root, int nXOut, int nYOut, + const std::string &expression, + const std::map &sources, + const std::map &sourceProps) +{ + int nOutBands = 1; // By default, each expression produces a single output + // band. When processing the expression below, we may + // discover that the expression produces multiple bands, + // in which case this will be updated. + for (int nOutBand = 1; nOutBand <= nOutBands; nOutBand++) + { + // Copy the expression for each output band, because we may modify it + // when adding band indices (e.g., X -> X[1]) to the variables in the + // expression. + std::string bandExpression = expression; + + CPLXMLNode *band = CPLCreateXMLNode(root, CXT_Element, "VRTRasterBand"); + CPLAddXMLAttributeAndValue(band, "subClass", "VRTDerivedRasterBand"); + // TODO: Allow user specification of output data type? + CPLAddXMLAttributeAndValue(band, "dataType", "Float64"); + + CPLXMLNode *pixelFunctionType = + CPLCreateXMLNode(band, CXT_Element, "PixelFunctionType"); + CPLCreateXMLNode(pixelFunctionType, CXT_Text, "expression"); + CPLXMLNode *arguments = + CPLCreateXMLNode(band, CXT_Element, "PixelFunctionArguments"); + + for (const auto &[source_name, dsn] : sources) + { + auto it = sourceProps.find(source_name); + CPLAssert(it != sourceProps.end()); + const auto &props = it->second; + + { + const int nDefaultInBand = std::min(props.nBands, nOutBand); + + CPLString expressionBandVariable; + expressionBandVariable.Printf("%s[%d]", source_name.c_str(), + nDefaultInBand); + + bool expressionUsesAllBands = false; + bandExpression = + SetBandIndices(bandExpression, source_name, nDefaultInBand, + expressionUsesAllBands); + + if (expressionUsesAllBands) + { + if (nOutBands <= 1) + { + nOutBands = props.nBands; + } + else if (props.nBands != 1 && props.nBands != nOutBands) + { + CPLError(CE_Failure, CPLE_AppDefined, + "Expression cannot operate on all bands of " + "rasters with incompatible numbers of bands " + "(source %s has %d bands but expected to have " + "1 or %d bands).", + source_name.c_str(), props.nBands, nOutBands); + return false; + } + } + } + + // Create a for each input band that is used in + // the expression. + for (int nInBand = 1; nInBand <= props.nBands; nInBand++) + { + CPLString inBandVariable; + inBandVariable.Printf("%s[%d]", source_name.c_str(), nInBand); + if (bandExpression.find(inBandVariable) == std::string::npos) + { + continue; + } + + CPLXMLNode *source = + CPLCreateXMLNode(band, CXT_Element, "SimpleSource"); + CPLAddXMLAttributeAndValue(source, "name", + inBandVariable.c_str()); + + CPLXMLNode *sourceFilename = + CPLCreateXMLNode(source, CXT_Element, "SourceFilename"); + CPLAddXMLAttributeAndValue(sourceFilename, "relativeToVRT", + "0"); + CPLCreateXMLNode(sourceFilename, CXT_Text, dsn.c_str()); + + CPLXMLNode *sourceBand = + CPLCreateXMLNode(source, CXT_Element, "SourceBand"); + CPLCreateXMLNode(sourceBand, CXT_Text, + std::to_string(nInBand).c_str()); + + // TODO add ? + + CPLXMLNode *srcRect = + CPLCreateXMLNode(source, CXT_Element, "SrcRect"); + CPLAddXMLAttributeAndValue(srcRect, "xOff", "0"); + CPLAddXMLAttributeAndValue(srcRect, "yOff", "0"); + CPLAddXMLAttributeAndValue(srcRect, "xSize", + std::to_string(props.nX).c_str()); + CPLAddXMLAttributeAndValue(srcRect, "ySize", + std::to_string(props.nY).c_str()); + + CPLXMLNode *dstRect = + CPLCreateXMLNode(source, CXT_Element, "DstRect"); + CPLAddXMLAttributeAndValue(dstRect, "xOff", "0"); + CPLAddXMLAttributeAndValue(dstRect, "yOff", "0"); + CPLAddXMLAttributeAndValue(dstRect, "xSize", + std::to_string(nXOut).c_str()); + CPLAddXMLAttributeAndValue(dstRect, "ySize", + std::to_string(nYOut).c_str()); + } + } + + // Add the expression as a last step, because we may modify the + // expression as we iterate through the bands. + CPLAddXMLAttributeAndValue(arguments, "expression", + bandExpression.c_str()); + CPLAddXMLAttributeAndValue(arguments, "dialect", "muparser"); + } + + return true; +} + +static bool ParseSourceDescriptors(const std::vector &inputs, + std::map &datasets, + std::string &firstSourceName) +{ + bool isFirst = true; + + for (const auto &input : inputs) + { + std::string name = ""; + + auto pos = input.find('='); + if (pos == std::string::npos) + { + if (inputs.size() > 1) + { + CPLError(CE_Failure, CPLE_AppDefined, + "Inputs must be named when more than one input is " + "provided."); + return false; + } + name = "X"; + } + else + { + name = input.substr(0, pos); + } + + std::string dsn = + (pos == std::string::npos) ? input : input.substr(pos + 1); + datasets[name] = std::move(dsn); + + if (isFirst) + { + firstSourceName = name; + isFirst = false; + } + } + + return true; +} + +static bool ReadFileLists(std::vector &inputs) +{ + for (std::size_t i = 0; i < inputs.size(); i++) + { + const auto &input = inputs[i]; + if (input[0] == '@') + { + auto f = + VSIVirtualHandleUniquePtr(VSIFOpenL(input.c_str() + 1, "r")); + if (!f) + { + CPLError(CE_Failure, CPLE_FileIO, "Cannot open %s", + input.c_str() + 1); + return false; + } + std::vector sources; + while (const char *filename = CPLReadLineL(f.get())) + { + sources.push_back(filename); + } + inputs.erase(inputs.begin() + static_cast(i)); + inputs.insert(inputs.end(), sources.begin(), sources.end()); + } + } + + return true; +} + +/** Creates a VRT datasource with one or more derived raster bands containing + * results of an expression. + * + * To make this work with muparser (which does not support vector types), we + * do a simple parsing of the expression internally, transforming it into + * multiple expressions with explicit band indices. For example, for a two-band + * raster "X", the expression "X + 3" will be transformed into "X[1] + 3" and + * "X[2] + 3". The use of brackets is for readability only; as far as the + * expression engine is concerned, the variables "X[1]" and "X[2]" have nothing + * to do with each other. + * + * @param inputs A list of sources, expressed as NAME=DSN + * @param expressions A list of expressions to be evaluated + * @param options flags controlling which checks should be performed on the inputs + * + * @return a newly created VRTDataset, or nullptr on error + */ +static std::unique_ptr +GDALCalcCreateVRTDerived(const std::vector &inputs, + const std::vector &expressions, + const GDALCalcOptions &options) +{ + if (inputs.empty()) + { + return nullptr; + } + + std::map sources; + std::string firstSource; + if (!ParseSourceDescriptors(inputs, sources, firstSource)) + { + return nullptr; + } + + // Use the first source provided to determine properties of the output + const char *firstDSN = sources[firstSource].c_str(); + + // Read properties from the first source + SourceProperties out; + { + std::unique_ptr ds( + GDALDataset::Open(firstDSN, GDAL_OF_RASTER)); + + if (!ds) + { + CPLError(CE_Failure, CPLE_AppDefined, "Failed to open %s", + firstDSN); + return nullptr; + } + + out.nX = ds->GetRasterXSize(); + out.nY = ds->GetRasterYSize(); + out.nBands = 1; + out.srs.reset(ds->GetSpatialRef() ? ds->GetSpatialRef()->Clone() + : nullptr); + ds->GetGeoTransform(out.gt.data()); + } + + CPLXMLNode *root = CPLCreateXMLNode(nullptr, CXT_Element, "VRTDataset"); + + // Collect properties of the different sources, and verity them for + // consistency. + std::map sourceProps; + for (const auto &[source_name, dsn] : sources) + { + // TODO avoid opening the first source twice. + auto props = UpdateSourceProperties(out, dsn, options); + if (props.has_value()) + { + sourceProps[source_name] = std::move(props.value()); + } + else + { + return nullptr; + } + } + + for (const auto &origExpression : expressions) + { + if (!CreateDerivedBandXML(root, out.nX, out.nY, origExpression, sources, + sourceProps)) + { + return nullptr; + } + } + + //CPLDebug("VRT", "%s", CPLSerializeXMLTree(root)); + + auto ds = std::make_unique(out.nX, out.nY); + if (ds->XMLInit(root, "") != CE_None) + { + return nullptr; + }; + ds->SetGeoTransform(out.gt.data()); + if (out.srs) + { + ds->SetSpatialRef(OGRSpatialReference::FromHandle(out.srs.get())); + } + + return ds; +} + +/************************************************************************/ +/* GDALRasterEditAlgorithm::GDALRasterEditAlgorithm() */ +/************************************************************************/ + +GDALRasterCalcAlgorithm::GDALRasterCalcAlgorithm() noexcept + : GDALAlgorithm(NAME, DESCRIPTION, HELP_URL) +{ + AddProgressArg(); + + AddArg(GDAL_ARG_NAME_INPUT, 'i', _("Input raster datasets"), &m_inputs) + .SetMinCount(1) + .SetAutoOpenDataset(false) + .SetMetaVar("INPUTS"); + + AddOutputFormatArg(&m_format); + AddOutputDatasetArg(&m_outputDataset, GDAL_OF_RASTER); + AddCreationOptionsArg(&m_creationOptions); + AddOverwriteArg(&m_overwrite); + + AddArg("no-check-srs", 0, + _("Do not check consistency of input spatial reference systems"), + &m_NoCheckSRS); + AddArg("no-check-extent", 0, _("Do not check consistency of input extents"), + &m_NoCheckExtent); + + AddArg("calc", 0, _("Expression(s) to evaluate"), &m_expr).SetMinCount(1); +} + +/************************************************************************/ +/* GDALRasterCalcAlgorithm::RunImpl() */ +/************************************************************************/ + +bool GDALRasterCalcAlgorithm::RunImpl(GDALProgressFunc pfnProgress, + void *pProgressData) +{ + if (m_outputDataset.GetDatasetRef()) + { + CPLError(CE_Failure, CPLE_NotSupported, + "gdal raster calc does not support outputting to an " + "already opened output dataset"); + return false; + } + + VSIStatBufL sStat; + if (!m_overwrite && !m_outputDataset.GetName().empty() && + (VSIStatL(m_outputDataset.GetName().c_str(), &sStat) == 0 || + std::unique_ptr( + GDALDataset::Open(m_outputDataset.GetName().c_str())))) + { + ReportError(CE_Failure, CPLE_AppDefined, + "File '%s' already exists. Specify the --overwrite " + "option to overwrite it.", + m_outputDataset.GetName().c_str()); + return false; + } + + GDALCalcOptions options; + options.checkExtent = !m_NoCheckExtent; + options.checkSRS = !m_NoCheckSRS; + + if (!ReadFileLists(m_inputs)) + { + return false; + } + + auto vrt = GDALCalcCreateVRTDerived(m_inputs, m_expr, options); + + if (vrt == nullptr) + { + return false; + } + + CPLStringList translateArgs; + if (!m_format.empty()) + { + translateArgs.AddString("-of"); + translateArgs.AddString(m_format.c_str()); + } + for (const auto &co : m_creationOptions) + { + translateArgs.AddString("-co"); + translateArgs.AddString(co.c_str()); + } + + GDALTranslateOptions *translateOptions = + GDALTranslateOptionsNew(translateArgs.List(), nullptr); + GDALTranslateOptionsSetProgress(translateOptions, pfnProgress, + pProgressData); + + auto poOutDS = + std::unique_ptr(GDALDataset::FromHandle(GDALTranslate( + m_outputDataset.GetName().c_str(), GDALDataset::ToHandle(vrt.get()), + translateOptions, nullptr))); + GDALTranslateOptionsFree(translateOptions); + + if (!poOutDS) + { + return false; + } + + m_outputDataset.Set(std::move(poOutDS)); + + return true; +} + +//! @endcond diff --git a/apps/gdalalg_raster_calc.h b/apps/gdalalg_raster_calc.h new file mode 100644 index 000000000000..d99a2b20feed --- /dev/null +++ b/apps/gdalalg_raster_calc.h @@ -0,0 +1,54 @@ +/****************************************************************************** + * + * Project: GDAL + * Purpose: "calc" step of "raster pipeline" + * Author: Daniel Baston + * + ****************************************************************************** + * Copyright (c) 2025, ISciences LLC + * + * SPDX-License-Identifier: MIT + ****************************************************************************/ + +#ifndef GDALALG_RASTER_CALC_INCLUDED +#define GDALALG_RASTER_CALC_INCLUDED + +#include "gdalalg_raster_pipeline.h" + +//! @cond Doxygen_Suppress + +/************************************************************************/ +/* GDALRasterCalcAlgorithm */ +/************************************************************************/ + +class GDALRasterCalcAlgorithm : public GDALAlgorithm +{ + public: + explicit GDALRasterCalcAlgorithm() noexcept; + + static constexpr const char *NAME = "calc"; + static constexpr const char *DESCRIPTION = "Perform raster algebra"; + static constexpr const char *HELP_URL = "/programs/gdal_raster_calc.html"; + + static std::vector GetAliases() + { + return {}; + } + + private: + bool RunImpl(GDALProgressFunc pfnProgress, void *pProgressData) override; + + std::vector m_inputs{}; + GDALArgDatasetValue m_dataset{}; + std::vector m_expr{}; + GDALArgDatasetValue m_outputDataset{}; + std::string m_format{}; + std::vector m_creationOptions{}; + bool m_overwrite{false}; + bool m_NoCheckSRS{false}; + bool m_NoCheckExtent{false}; +}; + +//! @endcond + +#endif /* GDALALG_RASTER_CALC_INCLUDED */ diff --git a/autotest/gdrivers/vrtderived.py b/autotest/gdrivers/vrtderived.py index 90e955a8f806..52220fc4a09d 100755 --- a/autotest/gdrivers/vrtderived.py +++ b/autotest/gdrivers/vrtderived.py @@ -1222,6 +1222,13 @@ def vrt_expression_xml(tmpdir, expression, dialect, sources): ["exprtk"], id="expression returns nodata", ), + pytest.param( + "ZB[1] + B[1]", + [("ZB[1]", 7), ("B[1]", 3)], + 10, + ["muparser"], + id="index substitution works correctly", + ), ], ) @pytest.mark.parametrize("dialect", ("exprtk", "muparser")) @@ -1274,8 +1281,8 @@ def test_vrt_pixelfn_expression( id="expression is too long", ), pytest.param( - "B[1]", - [("B[1]", 3)], + "B@1", + [("B@1", 3)], "muparser", "Invalid variable name", id="invalid variable name", diff --git a/autotest/utilities/test_gdalalg_raster_calc.py b/autotest/utilities/test_gdalalg_raster_calc.py new file mode 100755 index 000000000000..00ae5b37332b --- /dev/null +++ b/autotest/utilities/test_gdalalg_raster_calc.py @@ -0,0 +1,431 @@ +#!/usr/bin/env pytest +# -*- coding: utf-8 -*- +############################################################################### +# Project: GDAL/OGR Test Suite +# Purpose: 'gdal raster calc' testing +# Author: Daniel Baston +# +############################################################################### +# Copyright (c) 2025, ISciences LLC +# +# SPDX-License-Identifier: MIT +############################################################################### + +import re + +import gdaltest +import pytest + +from osgeo import gdal + +gdal.UseExceptions() + + +@pytest.fixture(scope="module", autouse=True) +def require_muparser(): + if not gdaltest.gdal_has_vrt_expression_dialect("muparser"): + pytest.skip("muparser not available") + + +@pytest.fixture() +def calc(): + reg = gdal.GetGlobalAlgorithmRegistry() + raster = reg.InstantiateAlg("raster") + return raster.InstantiateSubAlgorithm("calc") + + +@pytest.mark.parametrize("output_format", ("tif", "vrt")) +def test_gdalalg_raster_calc_basic_1(calc, tmp_vsimem, output_format): + + np = pytest.importorskip("numpy") + + infile = "../gcore/data/rgbsmall.tif" + outfile = tmp_vsimem / "out.tif" + + calc["input"] = [infile] + calc["output"] = outfile + calc["calc"] = ["2 + X / (1 + sum(X[1], X[2], X[3]))"] + + assert calc.Run() + + with gdal.Open(infile) as src, gdal.Open(outfile) as dst: + srcval = src.ReadAsArray().astype("float64") + expected = np.apply_along_axis(lambda x: 2 + x / (1 + x.sum()), 0, srcval) + + np.testing.assert_array_equal(expected, dst.ReadAsArray()) + assert src.GetGeoTransform() == dst.GetGeoTransform() + assert src.GetSpatialRef().IsSame(dst.GetSpatialRef()) + + +@pytest.mark.parametrize("output_format", ("tif", "vrt")) +def test_gdalalg_raster_calc_basic_2(calc, tmp_vsimem, output_format): + + np = pytest.importorskip("numpy") + + infile = "../gcore/data/byte.tif" + outfile = tmp_vsimem / "out.tif" + + calc["input"] = [infile] + calc["output"] = outfile + calc["calc"] = ["X > 128 ? X + 3 : nan"] + + assert calc.Run() + + with gdal.Open(infile) as src, gdal.Open(outfile) as dst: + srcval = src.ReadAsArray().astype("float64") + expected = np.where(srcval > 128, srcval + 3, float("nan")) + + np.testing.assert_array_equal(expected, dst.ReadAsArray()) + assert src.GetGeoTransform() == dst.GetGeoTransform() + assert src.GetSpatialRef().IsSame(dst.GetSpatialRef()) + + +def test_gdalalg_raster_calc_creation_options(calc, tmp_vsimem): + + infile = "../gcore/data/byte.tif" + outfile = tmp_vsimem / "out.tif" + + calc["input"] = [infile] + calc["output"] = outfile + calc["creation-option"] = ["COMPRESS=LZW"] + calc["calc"] = ["X[1] + 3"] + + assert calc.Run() + + with gdal.Open(outfile) as dst: + assert dst.GetMetadata("IMAGE_STRUCTURE")["COMPRESSION"] == "LZW" + + +def test_gdalalg_raster_calc_output_format(calc, tmp_vsimem): + + infile = "../gcore/data/byte.tif" + outfile = tmp_vsimem / "out.unknown" + + calc["input"] = [infile] + calc["output"] = outfile + calc["output-format"] = "GTiff" + calc["calc"] = ["X + 3"] + + assert calc.Run() + + with gdal.Open(outfile) as dst: + assert dst.GetDriver().GetName() == "GTiff" + + +def test_gdalalg_raster_calc_overwrite(calc, tmp_vsimem): + + infile = "../gcore/data/byte.tif" + outfile = tmp_vsimem / "out.tif" + + gdal.CopyFile(infile, outfile) + + calc["input"] = [infile] + calc["output"] = outfile + calc["calc"] = ["X + 3"] + + with pytest.raises(Exception, match="already exists"): + assert not calc.Run() + + calc["overwrite"] = True + + assert calc.Run() + + +@pytest.mark.parametrize("expr", ("X + 3", "X[1] + 3")) +def test_gdalalg_raster_calc_basic_named_source(calc, tmp_vsimem, expr): + + np = pytest.importorskip("numpy") + + infile = "../gcore/data/byte.tif" + outfile = tmp_vsimem / "out.tif" + + calc["input"] = [f"X={infile}"] + calc["output"] = outfile + calc["calc"] = [expr] + + assert calc.Run() + + with gdal.Open(infile) as src, gdal.Open(outfile) as dst: + np.testing.assert_array_equal(src.ReadAsArray() + 3.0, dst.ReadAsArray()) + + +def test_gdalalg_raster_calc_multiple_calcs(calc, tmp_vsimem): + + np = pytest.importorskip("numpy") + + infile = "../gcore/data/byte.tif" + outfile = tmp_vsimem / "out.tif" + + calc["input"] = [infile] + calc["output"] = outfile + calc["calc"] = ["X + 3", "sqrt(X)"] + + assert calc.Run() + + with gdal.Open(infile) as src, gdal.Open(outfile) as dst: + src_dat = src.ReadAsArray() + dst_dat = dst.ReadAsArray() + + np.testing.assert_array_equal(src_dat + 3.0, dst_dat[0]) + np.testing.assert_array_equal(np.sqrt(src_dat.astype(np.float64)), dst_dat[1]) + + +@pytest.mark.parametrize( + "expr", + ( + "(A+B) / (A - B + 3)", + "A[2] + B", + ), +) +def test_gdalalg_raster_calc_multiple_inputs(calc, tmp_vsimem, expr): + + np = pytest.importorskip("numpy") + + # convert 1-based indices to 0-based indices to evaluate expression + # with numpy + numpy_expr = expr + for match in re.findall(r"(?<=\[)\d+(?=])", expr): + numpy_expr = re.sub(match, str(int(match) - 1), expr, count=1) + + nx = 3 + ny = 5 + nz = 2 + + input_1 = tmp_vsimem / "in1.tif" + input_2 = tmp_vsimem / "in2.tif" + outfile = tmp_vsimem / "out.tif" + + A = np.arange(nx * ny * nz, dtype=np.float32).reshape(nz, ny, nx) + B = np.sqrt(A) + + with gdal.GetDriverByName("GTiff").Create( + input_1, nx, ny, nz, eType=gdal.GDT_Float32 + ) as ds: + ds.WriteArray(A) + + with gdal.GetDriverByName("GTiff").Create( + input_2, nx, ny, nz, eType=gdal.GDT_Float32 + ) as ds: + ds.WriteArray(B) + + calc["input"] = [f"A={input_1}", f"B={input_2}"] + calc["output"] = outfile + calc["calc"] = [expr] + + assert calc.Run() + + with gdal.Open(outfile) as dst: + dat = dst.ReadAsArray() + np.testing.assert_allclose(dat, eval(numpy_expr), rtol=1e-6) + + +def test_gdalalg_raster_calc_inputs_from_file(calc, tmp_vsimem, tmp_path): + + np = pytest.importorskip("numpy") + + input_1 = tmp_vsimem / "in1.tif" + input_2 = tmp_vsimem / "in2.tif" + input_txt = tmp_path / "inputs.txt" + outfile = tmp_vsimem / "out.tif" + + with gdal.GetDriverByName("GTiff").Create(input_1, 2, 2) as ds: + ds.GetRasterBand(1).Fill(1) + + with gdal.GetDriverByName("GTIff").Create(input_2, 2, 2) as ds: + ds.GetRasterBand(1).Fill(2) + + with gdal.VSIFile(input_txt, "w") as txtfile: + txtfile.write(f"A={input_1}\n") + txtfile.write(f"B={input_2}\n") + + calc["input"] = [f"@{input_txt}"] + calc["output"] = outfile + calc["calc"] = ["A + B"] + + assert calc.Run() + + with gdal.Open(outfile) as dst: + assert np.all(dst.ReadAsArray() == 3) + + +def test_gdalalg_raster_calc_different_band_counts(calc, tmp_vsimem): + + np = pytest.importorskip("numpy") + + input_1 = tmp_vsimem / "in1.tif" + input_2 = tmp_vsimem / "in2.tif" + outfile = tmp_vsimem / "out.tif" + + with gdal.GetDriverByName("GTiff").Create(input_1, 2, 2, 2) as ds: + ds.GetRasterBand(1).Fill(1) + ds.GetRasterBand(2).Fill(2) + + with gdal.GetDriverByName("GTIff").Create(input_2, 2, 2, 3) as ds: + ds.GetRasterBand(1).Fill(3) + ds.GetRasterBand(2).Fill(4) + ds.GetRasterBand(3).Fill(5) + + calc["input"] = [f"A={input_1}", f"B={input_2}"] + calc["output"] = outfile + calc["calc"] = ["A[1] + A[2] + B[1] + B[2] + B[3]"] + + assert calc.Run() + + with gdal.Open(outfile) as dst: + assert np.all(dst.ReadAsArray() == (1 + 2 + 3 + 4 + 5)) + + +def test_gdalalg_calc_different_resolutions(calc, tmp_vsimem): + + np = pytest.importorskip("numpy") + + xmax = 60 + ymax = 60 + resolutions = [10, 20, 60] + + inputs = [tmp_vsimem / f"in_{i}.tif" for i in range(len(resolutions))] + outfile = tmp_vsimem / "out.tif" + + for res, fname in zip(resolutions, inputs): + with gdal.GetDriverByName("GTiff").Create( + fname, int(xmax / res), int(ymax / res), 1 + ) as ds: + ds.GetRasterBand(1).Fill(res) + ds.SetGeoTransform((0, res, 0, ymax, 0, -res)) + + calc["input"] = [f"A={inputs[0]}", f"B={inputs[1]}", f"C={inputs[2]}"] + calc["calc"] = ["A + B + C"] + calc["output"] = outfile + + calc["no-check-extent"] = True + with pytest.raises(Exception, match="Inputs do not have the same dimensions"): + calc.Run() + calc["no-check-extent"] = False + + assert calc.Run() + + with gdal.Open(outfile) as ds: + assert ds.RasterXSize == xmax / min(resolutions) + assert ds.RasterYSize == ymax / min(resolutions) + + assert np.all(ds.ReadAsArray() == sum(resolutions)) + + +def test_gdalalg_raster_calc_error_extent_mismatch(calc, tmp_vsimem): + + input_1 = tmp_vsimem / "in1.tif" + input_2 = tmp_vsimem / "in2.tif" + outfile = tmp_vsimem / "out.tif" + + with gdal.GetDriverByName("GTiff").Create(input_1, 2, 2) as ds: + ds.SetGeoTransform((0, 1, 0, 2, 0, -1)) + with gdal.GetDriverByName("GTIff").Create(input_2, 2, 2) as ds: + ds.SetGeoTransform((0, 2, 0, 4, 0, -2)) + + calc["input"] = [f"A={input_1}", f"B={input_2}"] + calc["output"] = outfile + calc["calc"] = ["A+B"] + + with pytest.raises(Exception, match="extents are inconsistent"): + calc.Run() + + calc["no-check-extent"] = True + assert calc.Run() + + with gdal.Open(input_1) as src, gdal.Open(outfile) as dst: + assert src.GetGeoTransform() == dst.GetGeoTransform() + + +def test_gdalalg_raster_calc_error_crs_mismatch(calc, tmp_vsimem): + + input_1 = tmp_vsimem / "in1.tif" + input_2 = tmp_vsimem / "in2.tif" + outfile = tmp_vsimem / "out.tif" + + with gdal.GetDriverByName("GTiff").Create(input_1, 2, 2) as ds: + ds.SetProjection("EPSG:4326") + with gdal.GetDriverByName("GTIff").Create(input_2, 2, 2) as ds: + ds.SetProjection("EPSG:4269") + + calc["input"] = [f"B={input_1}", f"A={input_2}"] + calc["output"] = outfile + calc["calc"] = ["A+B"] + + with pytest.raises(Exception, match="spatial reference systems are inconsistent"): + calc.Run() + + calc["no-check-srs"] = True + assert calc.Run() + + with gdal.Open(input_1) as src, gdal.Open(outfile) as dst: + assert src.GetSpatialRef().IsSame(dst.GetSpatialRef()) + + +@pytest.mark.parametrize("bands", [(2, 3), (2, 4)]) +def test_gdalalg_raster_calc_error_band_count_mismatch(calc, tmp_vsimem, bands): + + input_1 = tmp_vsimem / "in1.tif" + input_2 = tmp_vsimem / "in2.tif" + outfile = tmp_vsimem / "out.tif" + + gdal.GetDriverByName("GTiff").Create(input_1, 2, 2, bands[0]) + gdal.GetDriverByName("GTIff").Create(input_2, 2, 2, bands[1]) + + calc["input"] = [f"A={input_1}", f"B={input_2}"] + calc["output"] = outfile + calc["calc"] = ["A+B"] + + with pytest.raises(Exception, match="incompatible numbers of bands"): + calc.Run() + + calc["calc"] = ["A+B[1]"] + assert calc.Run() + + +@pytest.mark.parametrize( + "expr,source,bands,expected", + [ + ("aX + 2", "aX", 1, ["aX[1] + 2"]), + ("aX + 2", "aX", 2, ["aX[1] + 2", "aX[2] + 2"]), + ("aX + 2", "X", 1, ["aX + 2"]), + ("aX + 2", "a", 1, ["aX + 2"]), + ("2 + aX", "X", 1, ["2 + aX"]), + ("2 + aX", "aX", 1, ["2 + aX[1]"]), + ("B1 + B10", "B1", 1, ["B1[1] + B10"]), + ("B1[1] + B10", "B1", 2, ["B1[1] + B10"]), + ("B1[1] + B1", "B1", 2, ["B1[1] + B1[1]", "B1[1] + B1[2]"]), + ("SIN(N) + N", "N", 1, ["SIN(N[1]) + N[1]"]), + ("SUM(N,N2) + N", "N", 1, ["SUM(N[1],N2) + N[1]"]), + ("SUM(N,N2) + N", "N2", 1, ["SUM(N,N2[1]) + N"]), + ("A_X + X", "X", 1, ["A_X + X[1]"]), + ], +) +def test_gdalalg_raster_calc_expression_rewriting( + calc, tmp_vsimem, expr, source, bands, expected +): + # The expression rewriting isn't exposed to Python, so we + # create an VRT with an expression and a single source, and + # inspect the transformed expression in the VRT XML. + # The transformed expression need not be valid, because we + # don't actually read the VRT in GDAL. + + import xml.etree.ElementTree as ET + + outfile = tmp_vsimem / "out.vrt" + infile = tmp_vsimem / "input.tif" + + gdal.GetDriverByName("GTiff").Create(infile, 2, 2, bands) + + calc["input"] = [f"{source}={infile}"] + calc["output"] = outfile + calc["calc"] = [expr] + + assert calc.Run() + + with gdal.VSIFile(outfile, "r") as f: + root = ET.fromstring(f.read()) + + expr = [ + node.attrib["expression"] for node in root.findall(".//PixelFunctionArguments") + ] + assert expr == expected diff --git a/doc/source/programs/gdal_raster.rst b/doc/source/programs/gdal_raster.rst index 4f6190896d98..bcc331dce415 100644 --- a/doc/source/programs/gdal_raster.rst +++ b/doc/source/programs/gdal_raster.rst @@ -19,6 +19,7 @@ Synopsis Usage: gdal raster where is one of: + - calc: Perform raster algebra. - clip: Clip a raster dataset. - convert: Convert a raster dataset. - edit: Edit a raster dataset. @@ -34,6 +35,7 @@ Available sub-commands ---------------------- - :ref:`gdal_raster_info_subcommand` +- :ref:`gdal_raster_calc_subcommand` - :ref:`gdal_raster_clip_subcommand` - :ref:`gdal_raster_convert_subcommand` - :ref:`gdal_raster_mosaic_subcommand` diff --git a/doc/source/programs/gdal_raster_calc.rst b/doc/source/programs/gdal_raster_calc.rst new file mode 100644 index 000000000000..0d1b8c6092cb --- /dev/null +++ b/doc/source/programs/gdal_raster_calc.rst @@ -0,0 +1,104 @@ +.. _gdal_raster_calc_subcommand: + +================================================================================ +"gdal raster calc" sub-command +================================================================================ + +.. versionadded:: 3.11 + +.. only:: html + + Perform raster algebra + +.. Index:: gdal raster calc + +Synopsis +-------- + +.. program-output:: gdal raster calc --help + :ellipsis: -5 + + +Description +----------- + +:program:`gdal raster calc` performs pixel-wise calculations on one or more input GDAL datasets. Calculations +can be performed eagerly, writing results to a conventional raster format, +or lazily, written as a set of derived bands in a :ref:`VRT (Virtual Dataset) `. + +The list of input GDAL datasets can be specified at the end +of the command line or put in a text file (one input per line) for very long lists. +If more than one input dataset is used, it should be prefixed with a name by which it +will be referenced in the calculation, e.g. ``A=my_data.tif``. (If a single dataset is +used, it will be referred to with the variable ``X`` in formulas.) + +The inputs should have the same spatial reference system and should cover the same spatial extent but are not required to have the same +spatial resolution. The spatial extent check can be disabled with :option:`--no-check-extent`, +in which case the inputs must have the same dimensions. The spatial reference system check can be +disabled with :option:`--no-check-srs`. + +The following options are available: + +.. include:: gdal_options/of_raster_create_copy.rst + +.. include:: gdal_options/co.rst + +.. include:: gdal_options/overwrite.rst + +.. option:: -i [=] + + Select an input dataset to be processed. If more than one input dataset is provided, + each dataset must be prefixed with a name to which it will will be referenced in :option:`--calc`. + +.. option:: --calc + + An expression to be evaluated using the `muparser `__ math parser library. + The expression may refer to individual bands of each input (e.g., ``X[1] + 3``) or it may be applied to all bands + of an input (``X + 3``). If the expression contains a reference to all bands of multiple inputs, those inputs + must either have the same the number of bands, or a single band. + + For example, if inputs ``A`` and ``B`` each have three bands, and input ``C`` has a single band, then the argument + ``--calc "A + B + C"`` is equivalent to ``--calc "A[1] + B[1] + C[1]" --calc "A[2] + B[2] + C[1]" --calc "A[3] + B[3] + C[1]"``. + + Multiple calculations may be specified; output band(s) will be produced for each expression in the order they + are provided. + + Input rasters will be converted to 64-bit floating point numbers before performing calculations. + +.. option:: --no-check-extent + + Do not verify that the input rasters have the same spatial extent. The input rasters will instead be required to + have the same dimensions. The geotransform of the first input will be assigned to the output. + +.. option:: --no-check-srs + + Do not check the spatial reference systems of the inputs for consistency. All inputs will be assumed to have the + spatial reference system of the first input, and this spatial reference system will be used for the output. + +Examples +-------- + +.. example:: + :title: Per-band sum of three files + :id: simple-sum + + .. code-block:: bash + + gdal raster calc -i "A=file1.tif" -i "B=file2.tif" -i "C=file3.tif" --calc "A+B+C" -o out.tif + + +.. example:: + :title: Per-band maximum of three files + :id: simple-max + + .. code-block:: bash + + gdal raster calc -i "A=file1.tif" -i "B=file2.tif" -i "C=file3.tif" --calc "max(A,B,C)" -o out.tif + + +.. example:: + :title: Setting values of zero and below to NaN + + .. code-block:: bash + + gdal_calc -i "A=input.tif" -o=result.tif --calc="A > 0 ? A : NaN" diff --git a/doc/source/programs/index.rst b/doc/source/programs/index.rst index 23afc8cb9aab..7a7927d3a6cb 100644 --- a/doc/source/programs/index.rst +++ b/doc/source/programs/index.rst @@ -32,6 +32,7 @@ single :program:`gdal` program that accepts commands and subcommands. gdal_convert gdal_raster gdal_raster_info + gdal_raster_calc gdal_raster_clip gdal_raster_convert gdal_raster_edit @@ -60,6 +61,7 @@ single :program:`gdal` program that accepts commands and subcommands. - :ref:`gdal_convert_command`: Convert a dataset - :ref:`gdal_raster_command`: Entry point for raster commands - :ref:`gdal_raster_info_subcommand`: Get information on a raster dataset + - :ref:`gdal_raster_calc_subcommand`: Perform raster algebra - :ref:`gdal_raster_clip_subcommand`: Clip a raster dataset - :ref:`gdal_raster_convert_subcommand`: Convert a raster dataset - :ref:`gdal_raster_edit_subcommand`: Edit in place a raster dataset diff --git a/frmts/vrt/vrtexpression_muparser.cpp b/frmts/vrt/vrtexpression_muparser.cpp index d9e747302c21..3910db4573dd 100644 --- a/frmts/vrt/vrtexpression_muparser.cpp +++ b/frmts/vrt/vrtexpression_muparser.cpp @@ -13,19 +13,65 @@ #include "vrtexpression.h" #include "cpl_string.h" +#include #include +#include #include namespace gdal { /*! @cond Doxygen_Suppress */ + +static std::optional Sanitize(const std::string &osVariable) +{ + // muparser does not allow characters '[' or ']' which we use to emulate + // vectors. Replace these with a combination of underscores + auto from = osVariable.find('['); + if (from != std::string::npos) + { + auto to = osVariable.find(']'); + if (to != std::string::npos) + { + auto sanitized = std::string("__") + osVariable.substr(0, from) + + +"__" + + osVariable.substr(from + 1, to - from - 1) + "__"; + return sanitized; + } + } + + return std::nullopt; +} + +static void ReplaceVariable(std::string &expression, + const std::string &variable, + const std::string &sanitized) +{ + std::string::size_type seekPos = 0; + auto pos = expression.find(variable, seekPos); + while (pos != std::string::npos) + { + auto end = pos + variable.size(); + + if (pos == 0 || + (!std::isalnum(expression[pos - 1]) && expression[pos - 1] != '_')) + { + expression = + expression.substr(0, pos) + sanitized + expression.substr(end); + } + + seekPos = end; + pos = expression.find(variable, seekPos); + } +} + class MuParserExpression::Impl { public: explicit Impl(std::string_view osExpression) - : m_osExpression(std::string(osExpression)), m_oVectors{}, m_oParser{}, - m_adfResults{1}, m_bIsCompiled{false}, m_bCompileFailed{false} + : m_osExpression(std::string(osExpression)), m_oSubstitutions{}, + m_oParser{}, m_adfResults{1}, m_bIsCompiled{false}, m_bCompileFailed{ + false} { } @@ -50,13 +96,26 @@ class MuParserExpression::Impl return CE_Failure; } + // On some platforms muparser does not seem to parse "nan" as a floating + // point literal. try { - CPLString tmpExpression(m_osExpression); + m_oParser.DefineConst("nan", + std::numeric_limits::quiet_NaN()); + m_oParser.DefineConst("NaN", + std::numeric_limits::quiet_NaN()); + } + catch (const mu::Parser::exception_type &) + { + } + + try + { + std::string tmpExpression(m_osExpression); - for (const auto &[osVec, osElems] : m_oVectors) + for (const auto &[osFrom, osTo] : m_oSubstitutions) { - tmpExpression.replaceAll(osVec, osElems); + ReplaceVariable(tmpExpression, osFrom, osTo); } m_oParser.SetExpr(tmpExpression); @@ -108,8 +167,8 @@ class MuParserExpression::Impl return CE_None; } - CPLString m_osExpression; - std::map m_oVectors; + const CPLString m_osExpression; + std::map m_oSubstitutions; mu::Parser m_oParser; std::vector m_adfResults; bool m_bIsCompiled; @@ -134,7 +193,12 @@ CPLErr MuParserExpression::Compile() void MuParserExpression::RegisterVariable(std::string_view osVariable, double *pdfValue) { - m_pImpl->Register(osVariable, pdfValue); + auto sanitized = Sanitize(std::string(osVariable)); + if (sanitized.has_value()) + { + m_pImpl->m_oSubstitutions[std::string(osVariable)] = sanitized.value(); + } + m_pImpl->Register(sanitized.value_or(std::string(osVariable)), pdfValue); } void MuParserExpression::RegisterVector(std::string_view osVariable, @@ -155,8 +219,9 @@ void MuParserExpression::RegisterVector(std::string_view osVariable, for (std::size_t i = 0; i < padfValues->size(); i++) { - osElementVarName.Printf("__%s_%d", osVectorVarName.c_str(), + osElementVarName.Printf("%s[%d]", osVectorVarName.c_str(), static_cast(i)); + osElementVarName = Sanitize(osElementVarName).value(); RegisterVariable(osElementVarName, padfValues->data() + i); if (i > 0) @@ -166,7 +231,7 @@ void MuParserExpression::RegisterVector(std::string_view osVariable, osElementsList += osElementVarName; } - m_pImpl->m_oVectors[std::string(osVariable)] = osElementsList; + m_pImpl->m_oSubstitutions[std::string(osVariable)] = osElementsList; } CPLErr MuParserExpression::Evaluate() diff --git a/frmts/vrt/vrtsources.cpp b/frmts/vrt/vrtsources.cpp index c16b085b950e..64bd38932d5f 100644 --- a/frmts/vrt/vrtsources.cpp +++ b/frmts/vrt/vrtsources.cpp @@ -489,6 +489,11 @@ CPLXMLNode *VRTSimpleSource::SerializeToXML(const char *pszVRTPath) CXT_Text, m_osResampling.c_str()); } + if (!m_osName.empty()) + { + CPLAddXMLAttributeAndValue(psSrc, "name", m_osName); + } + if (m_bSrcDSNameFromVRT) { CPLAddXMLChild(psSrc, CPLParseXMLString(m_osSrcDSName.c_str())); diff --git a/gcore/gdalalgorithm.h b/gcore/gdalalgorithm.h index 2853d23bb350..9a0788c9822d 100644 --- a/gcore/gdalalgorithm.h +++ b/gcore/gdalalgorithm.h @@ -423,7 +423,7 @@ class CPL_DLL GDALArgDatasetValue final /** Set dataset name */ void Set(const std::string &name); - /** Transfer dataset to this instance (does not affect is reference + /** Transfer dataset to this instance (does not affect its reference * counter). */ void Set(std::unique_ptr poDS); diff --git a/swig/include/python/gdal_python.i b/swig/include/python/gdal_python.i index db9a0ac37dcb..60d628c62723 100644 --- a/swig/include/python/gdal_python.i +++ b/swig/include/python/gdal_python.i @@ -5365,6 +5365,10 @@ class VSIFile(BytesIO): raise Exception("Unhandled algorithm argument data type") def Set(self, value): + import os + if isinstance(value, os.PathLike): + value = str(value) + type = self.GetType() if type == GAAT_BOOLEAN: return self.SetAsBoolean(value) From 2768934ab7beeadc23d17d18f7464206ed9544bc Mon Sep 17 00:00:00 2001 From: Even Rouault Date: Wed, 12 Feb 2025 00:16:57 +0100 Subject: [PATCH 7/9] gdal vector: make 'read', 'clip' and 'reproject' compatible of OSM-type of datasources that require ODsCRandomLayerRead On-the-fly reading of OSM requires to be able to iterate over features at the dataset level, and not just at the layer level. Let's implement that. --- apps/gdalalg_vector_clip.cpp | 147 ++++++--------- apps/gdalalg_vector_pipeline.cpp | 171 ++++++++++++++++++ apps/gdalalg_vector_pipeline.h | 77 ++++++-- apps/gdalalg_vector_read.cpp | 121 ++++++++++++- apps/gdalalg_vector_reproject.cpp | 12 +- apps/gdalalg_vector_select.cpp | 14 +- apps/gdalalg_vector_write.cpp | 6 + .../utilities/test_gdalalg_vector_clip.py | 34 ++++ .../utilities/test_gdalalg_vector_pipeline.py | 81 ++++++++- .../test_gdalalg_vector_reproject.py | 57 ++++++ ogr/ogrsf_frmts/generic/CMakeLists.txt | 1 + ogr/ogrsf_frmts/generic/ogrlayerdecorator.h | 2 +- .../generic/ogrlayerwithtranslatefeature.cpp | 19 ++ .../generic/ogrlayerwithtranslatefeature.h | 36 ++++ .../generic/ogrmutexeddatasource.cpp | 2 +- ogr/ogrsf_frmts/generic/ogrwarpedlayer.cpp | 12 ++ ogr/ogrsf_frmts/generic/ogrwarpedlayer.h | 19 +- 17 files changed, 686 insertions(+), 125 deletions(-) create mode 100755 autotest/utilities/test_gdalalg_vector_reproject.py create mode 100644 ogr/ogrsf_frmts/generic/ogrlayerwithtranslatefeature.cpp create mode 100644 ogr/ogrsf_frmts/generic/ogrlayerwithtranslatefeature.h diff --git a/apps/gdalalg_vector_clip.cpp b/apps/gdalalg_vector_clip.cpp index ed5e9e714426..b63ad9604ebb 100644 --- a/apps/gdalalg_vector_clip.cpp +++ b/apps/gdalalg_vector_clip.cpp @@ -65,129 +65,99 @@ GDALVectorClipAlgorithm::GDALVectorClipAlgorithm(bool standaloneStep) namespace { -class GDALVectorClipAlgorithmLayer final - : public OGRLayer, - public OGRGetNextFeatureThroughRaw +class GDALVectorClipAlgorithmLayer final : public GDALVectorPipelineOutputLayer { - - DEFINE_GET_NEXT_FEATURE_THROUGH_RAW(GDALVectorClipAlgorithmLayer) - public: - GDALVectorClipAlgorithmLayer(OGRLayer *poSrcLayer, + GDALVectorClipAlgorithmLayer(OGRLayer &oSrcLayer, std::unique_ptr poClipGeom) - : m_poSrcLayer(poSrcLayer), m_poClipGeom(std::move(poClipGeom)), - m_eSrcLayerGeomType(m_poSrcLayer->GetGeomType()), + : GDALVectorPipelineOutputLayer(oSrcLayer), + m_poClipGeom(std::move(poClipGeom)), + m_eSrcLayerGeomType(oSrcLayer.GetGeomType()), m_eFlattenSrcLayerGeomType(wkbFlatten(m_eSrcLayerGeomType)), m_bSrcLayerGeomTypeIsCollection(OGR_GT_IsSubClassOf( m_eFlattenSrcLayerGeomType, wkbGeometryCollection)) { - SetDescription(poSrcLayer->GetDescription()); - poSrcLayer->SetSpatialFilter(m_poClipGeom.get()); + SetDescription(oSrcLayer.GetDescription()); + oSrcLayer.SetSpatialFilter(m_poClipGeom.get()); } OGRFeatureDefn *GetLayerDefn() override { - return m_poSrcLayer->GetLayerDefn(); - } - - void ResetReading() override - { - m_poSrcLayer->ResetReading(); - m_poSrcFeature.reset(); - m_poCurGeomColl.reset(); - m_idxInCurGeomColl = 0; + return m_srcLayer.GetLayerDefn(); } - OGRFeature *GetNextRawFeature() + void TranslateFeature( + std::unique_ptr poSrcFeature, + std::vector> &apoOutFeatures) override { - if (m_poSrcFeature && m_poCurGeomColl) + auto poGeom = poSrcFeature->GetGeometryRef(); + if (!poGeom) + return; + + auto poIntersection = std::unique_ptr( + poGeom->Intersection(m_poClipGeom.get())); + if (!poIntersection) + return; + + const auto eFeatGeomType = + wkbFlatten(poIntersection->getGeometryType()); + if (m_eFlattenSrcLayerGeomType != wkbUnknown && + m_eFlattenSrcLayerGeomType != eFeatGeomType) { - while (m_idxInCurGeomColl < m_poCurGeomColl->getNumGeometries()) + // If the intersection is a collection of geometry and the + // layer geometry type is of non-collection type, create + // one feature per element of the collection. + if (!m_bSrcLayerGeomTypeIsCollection && + OGR_GT_IsSubClassOf(eFeatGeomType, wkbGeometryCollection)) { - const auto poGeom = - m_poCurGeomColl->getGeometryRef(m_idxInCurGeomColl); - ++m_idxInCurGeomColl; - if (m_eFlattenSrcLayerGeomType == wkbUnknown || - m_eFlattenSrcLayerGeomType == - wkbFlatten(poGeom->getGeometryType())) + auto poGeomColl = std::unique_ptr( + poIntersection.release()->toGeometryCollection()); + for (const auto *poSubGeom : poGeomColl.get()) { auto poDstFeature = - std::unique_ptr(m_poSrcFeature->Clone()); - poDstFeature->SetGeometry(poGeom); - return poDstFeature.release(); + std::unique_ptr(poSrcFeature->Clone()); + poDstFeature->SetGeometry(poSubGeom); + apoOutFeatures.push_back(std::move(poDstFeature)); } } - m_poSrcFeature.reset(); - m_poCurGeomColl.reset(); - m_idxInCurGeomColl = 0; - } - - while (auto poFeature = - std::unique_ptr(m_poSrcLayer->GetNextFeature())) - { - auto poGeom = poFeature->GetGeometryRef(); - if (!poGeom) - continue; - - auto poIntersection = std::unique_ptr( - poGeom->Intersection(m_poClipGeom.get())); - if (!poIntersection) - continue; - - const auto eFeatGeomType = - wkbFlatten(poIntersection->getGeometryType()); - if (m_eFlattenSrcLayerGeomType != wkbUnknown && - m_eFlattenSrcLayerGeomType != eFeatGeomType) + else if (OGR_GT_GetCollection(eFeatGeomType) == + m_eFlattenSrcLayerGeomType) { - // If the intersection is a collection of geometry and the - // layer geometry type is of non-collection type, create - // one feature per element of the collection. - if (!m_bSrcLayerGeomTypeIsCollection && - OGR_GT_IsSubClassOf(eFeatGeomType, wkbGeometryCollection)) - { - m_poSrcFeature = std::move(poFeature); - m_poCurGeomColl.reset( - poIntersection.release()->toGeometryCollection()); - m_idxInCurGeomColl = 0; - return GetNextFeature(); - } - else if (OGR_GT_GetCollection(eFeatGeomType) == - m_eFlattenSrcLayerGeomType) - { - poIntersection.reset(OGRGeometryFactory::forceTo( - poIntersection.release(), m_eSrcLayerGeomType)); - poFeature->SetGeometryDirectly(poIntersection.release()); - return poFeature.release(); - } - // else discard geometries of incompatible type with the - // layer geometry type + poIntersection.reset(OGRGeometryFactory::forceTo( + poIntersection.release(), m_eSrcLayerGeomType)); + poSrcFeature->SetGeometryDirectly(poIntersection.release()); + apoOutFeatures.push_back(std::move(poSrcFeature)); } - else + else if (m_eFlattenSrcLayerGeomType == wkbGeometryCollection) { - poFeature->SetGeometryDirectly(poIntersection.release()); - return poFeature.release(); + auto poGeomColl = std::make_unique(); + poGeomColl->addGeometry(std::move(poIntersection)); + poSrcFeature->SetGeometryDirectly(poGeomColl.release()); + apoOutFeatures.push_back(std::move(poSrcFeature)); } + // else discard geometries of incompatible type with the + // layer geometry type + } + else + { + poSrcFeature->SetGeometryDirectly(poIntersection.release()); + apoOutFeatures.push_back(std::move(poSrcFeature)); } - return nullptr; } int TestCapability(const char *pszCap) override { if (EQUAL(pszCap, OLCStringsAsUTF8) || EQUAL(pszCap, OLCCurveGeometries) || EQUAL(pszCap, OLCZGeometries)) - return m_poSrcLayer->TestCapability(pszCap); + return m_srcLayer.TestCapability(pszCap); return false; } private: - OGRLayer *m_poSrcLayer = nullptr; std::unique_ptr m_poClipGeom{}; const OGRwkbGeometryType m_eSrcLayerGeomType; const OGRwkbGeometryType m_eFlattenSrcLayerGeomType; const bool m_bSrcLayerGeomTypeIsCollection; - std::unique_ptr m_poSrcFeature{}; - std::unique_ptr m_poCurGeomColl{}; - int m_idxInCurGeomColl = 0; CPL_DISALLOW_COPY_ASSIGN(GDALVectorClipAlgorithmLayer) }; @@ -428,8 +398,7 @@ bool GDALVectorClipAlgorithm::RunStep(GDALProgressFunc, void *) return false; } - auto outDS = std::make_unique(); - outDS->SetDescription(poSrcDS->GetDescription()); + auto outDS = std::make_unique(*poSrcDS); bool ret = true; for (int i = 0; ret && i < nLayerCount; ++i) @@ -448,8 +417,10 @@ bool GDALVectorClipAlgorithm::RunStep(GDALProgressFunc, void *) } if (ret) { - outDS->AddLayer(std::make_unique( - poSrcLayer, std::move(poClipGeomForLayer))); + outDS->AddLayer( + *poSrcLayer, + std::make_unique( + *poSrcLayer, std::move(poClipGeomForLayer))); } } } diff --git a/apps/gdalalg_vector_pipeline.cpp b/apps/gdalalg_vector_pipeline.cpp index cade33a94b40..f7a639c36b94 100644 --- a/apps/gdalalg_vector_pipeline.cpp +++ b/apps/gdalalg_vector_pipeline.cpp @@ -516,4 +516,175 @@ std::string GDALVectorPipelineAlgorithm::GetUsageForCLI( return ret; } +/************************************************************************/ +/* GDALVectorPipelineOutputLayer */ +/************************************************************************/ + +/************************************************************************/ +/* GDALVectorPipelineOutputLayer() */ +/************************************************************************/ + +GDALVectorPipelineOutputLayer::GDALVectorPipelineOutputLayer(OGRLayer &srcLayer) + : m_srcLayer(srcLayer) +{ +} + +/************************************************************************/ +/* GDALVectorPipelineOutputLayer::ResetReading() */ +/************************************************************************/ + +void GDALVectorPipelineOutputLayer::ResetReading() +{ + m_srcLayer.ResetReading(); + m_pendingFeatures.clear(); + m_idxInPendingFeatures = 0; +} + +/************************************************************************/ +/* GDALVectorPipelineOutputLayer::GetNextRawFeature() */ +/************************************************************************/ + +OGRFeature *GDALVectorPipelineOutputLayer::GetNextRawFeature() +{ + if (m_idxInPendingFeatures < m_pendingFeatures.size()) + { + OGRFeature *poFeature = + m_pendingFeatures[m_idxInPendingFeatures].release(); + ++m_idxInPendingFeatures; + return poFeature; + } + m_pendingFeatures.clear(); + m_idxInPendingFeatures = 0; + while (true) + { + auto poSrcFeature = + std::unique_ptr(m_srcLayer.GetNextFeature()); + if (!poSrcFeature) + return nullptr; + TranslateFeature(std::move(poSrcFeature), m_pendingFeatures); + if (!m_pendingFeatures.empty()) + break; + } + OGRFeature *poFeature = m_pendingFeatures[0].release(); + m_idxInPendingFeatures = 1; + return poFeature; +} + +/************************************************************************/ +/* GDALVectorPipelineOutputDataset */ +/************************************************************************/ + +/************************************************************************/ +/* GDALVectorPipelineOutputDataset() */ +/************************************************************************/ + +GDALVectorPipelineOutputDataset::GDALVectorPipelineOutputDataset( + GDALDataset &srcDS) + : m_srcDS(srcDS) +{ + SetDescription(m_srcDS.GetDescription()); +} + +/************************************************************************/ +/* GDALVectorPipelineOutputDataset::AddLayer() */ +/************************************************************************/ + +void GDALVectorPipelineOutputDataset::AddLayer( + OGRLayer &oSrcLayer, + std::unique_ptr poNewLayer) +{ + m_layersToDestroy.push_back(std::move(poNewLayer)); + OGRLayerWithTranslateFeature *poNewLayerRaw = + m_layersToDestroy.back().get(); + m_layers.push_back(poNewLayerRaw); + m_mapSrcLayerToNewLayer[&oSrcLayer] = poNewLayerRaw; +} + +/************************************************************************/ +/* GDALVectorPipelineOutputDataset::GetLayerCount() */ +/************************************************************************/ + +int GDALVectorPipelineOutputDataset::GetLayerCount() +{ + return static_cast(m_layers.size()); +} + +/************************************************************************/ +/* GDALVectorPipelineOutputDataset::GetLayer() */ +/************************************************************************/ + +OGRLayer *GDALVectorPipelineOutputDataset::GetLayer(int idx) +{ + return idx >= 0 && idx < GetLayerCount() ? m_layers[idx] : nullptr; +} + +/************************************************************************/ +/* GDALVectorPipelineOutputDataset::TestCapability() */ +/************************************************************************/ + +int GDALVectorPipelineOutputDataset::TestCapability(const char *pszCap) +{ + if (EQUAL(pszCap, ODsCRandomLayerRead)) + { + return m_srcDS.TestCapability(pszCap); + } + return false; +} + +/************************************************************************/ +/* GDALVectorPipelineOutputDataset::ResetReading() */ +/************************************************************************/ + +void GDALVectorPipelineOutputDataset::ResetReading() +{ + m_srcDS.ResetReading(); + m_pendingFeatures.clear(); + m_idxInPendingFeatures = 0; +} + +/************************************************************************/ +/* GDALVectorPipelineOutputDataset::GetNextFeature() */ +/************************************************************************/ + +OGRFeature *GDALVectorPipelineOutputDataset::GetNextFeature( + OGRLayer **ppoBelongingLayer, double *pdfProgressPct, + GDALProgressFunc pfnProgress, void *pProgressData) +{ + if (m_idxInPendingFeatures < m_pendingFeatures.size()) + { + OGRFeature *poFeature = + m_pendingFeatures[m_idxInPendingFeatures].release(); + if (ppoBelongingLayer) + *ppoBelongingLayer = m_belongingLayer; + ++m_idxInPendingFeatures; + return poFeature; + } + + m_pendingFeatures.clear(); + m_idxInPendingFeatures = 0; + + while (true) + { + OGRLayer *poSrcBelongingLayer = nullptr; + auto poSrcFeature = std::unique_ptr(m_srcDS.GetNextFeature( + &poSrcBelongingLayer, pdfProgressPct, pfnProgress, pProgressData)); + if (!poSrcFeature) + return nullptr; + auto iterToDstLayer = m_mapSrcLayerToNewLayer.find(poSrcBelongingLayer); + if (iterToDstLayer != m_mapSrcLayerToNewLayer.end()) + { + m_belongingLayer = iterToDstLayer->second; + m_belongingLayer->TranslateFeature(std::move(poSrcFeature), + m_pendingFeatures); + if (!m_pendingFeatures.empty()) + break; + } + } + OGRFeature *poFeature = m_pendingFeatures[0].release(); + if (ppoBelongingLayer) + *ppoBelongingLayer = m_belongingLayer; + m_idxInPendingFeatures = 1; + return poFeature; +} + //! @endcond diff --git a/apps/gdalalg_vector_pipeline.h b/apps/gdalalg_vector_pipeline.h index 4bf66820e0f0..8bbf6f249f4c 100644 --- a/apps/gdalalg_vector_pipeline.h +++ b/apps/gdalalg_vector_pipeline.h @@ -17,6 +17,10 @@ #include "gdalalg_abstract_pipeline.h" #include "ogrsf_frmts.h" +#include "ogrlayerwithtranslatefeature.h" + +#include +#include //! @cond Doxygen_Suppress @@ -108,6 +112,34 @@ class GDALVectorPipelineAlgorithm final } }; +/************************************************************************/ +/* GDALVectorPipelineOutputLayer */ +/************************************************************************/ + +/** Class that implements GetNextFeature() by forwarding to + * OGRLayerWithTranslateFeature::TranslateFeature() implementation, which + * might return several features. + */ +class GDALVectorPipelineOutputLayer /* non final */ + : public OGRLayerWithTranslateFeature, + public OGRGetNextFeatureThroughRaw +{ + protected: + explicit GDALVectorPipelineOutputLayer(OGRLayer &oSrcLayer); + + DEFINE_GET_NEXT_FEATURE_THROUGH_RAW(GDALVectorPipelineOutputLayer) + + OGRLayer &m_srcLayer; + + public: + void ResetReading() override; + OGRFeature *GetNextRawFeature(); + + private: + std::vector> m_pendingFeatures{}; + size_t m_idxInPendingFeatures = 0; +}; + /************************************************************************/ /* GDALVectorPipelineOutputDataset */ /************************************************************************/ @@ -117,32 +149,37 @@ class GDALVectorPipelineAlgorithm final */ class GDALVectorPipelineOutputDataset final : public GDALDataset { - std::vector> m_layersToDestroy{}; - std::vector m_layers{}; + GDALDataset &m_srcDS; + std::map + m_mapSrcLayerToNewLayer{}; + std::vector> + m_layersToDestroy{}; + std::vector m_layers{}; + + OGRLayerWithTranslateFeature *m_belongingLayer = nullptr; + std::vector> m_pendingFeatures{}; + size_t m_idxInPendingFeatures = 0; + + CPL_DISALLOW_COPY_ASSIGN(GDALVectorPipelineOutputDataset) public: - GDALVectorPipelineOutputDataset() = default; + explicit GDALVectorPipelineOutputDataset(GDALDataset &oSrcDS); - void AddLayer(std::unique_ptr poLayer) - { - m_layersToDestroy.push_back(std::move(poLayer)); - m_layers.push_back(m_layersToDestroy.back().get()); - } + void AddLayer(OGRLayer &oSrcLayer, + std::unique_ptr poNewLayer); - void AddLayer(OGRLayer *poLayer) - { - m_layers.push_back(poLayer); - } + int GetLayerCount() override; - int GetLayerCount() override - { - return static_cast(m_layers.size()); - } + OGRLayer *GetLayer(int idx) override; - OGRLayer *GetLayer(int idx) override - { - return idx >= 0 && idx < GetLayerCount() ? m_layers[idx] : nullptr; - } + int TestCapability(const char *pszCap) override; + + void ResetReading() override; + + OGRFeature *GetNextFeature(OGRLayer **ppoBelongingLayer, + double *pdfProgressPct, + GDALProgressFunc pfnProgress, + void *pProgressData) override; }; //! @endcond diff --git a/apps/gdalalg_vector_read.cpp b/apps/gdalalg_vector_read.cpp index 4af6c5e15d6e..a7d4aeae69c3 100644 --- a/apps/gdalalg_vector_read.cpp +++ b/apps/gdalalg_vector_read.cpp @@ -32,6 +32,121 @@ GDALVectorReadAlgorithm::GDALVectorReadAlgorithm() AddInputArgs(/* hiddenForCLI = */ false); } +/************************************************************************/ +/* GDALVectorPipelineReadOutputDataset */ +/************************************************************************/ + +/** Class used by vector pipeline steps to create an output on-the-fly + * dataset where they can store on-the-fly layers. + */ +class GDALVectorPipelineReadOutputDataset final : public GDALDataset +{ + GDALDataset &m_srcDS; + std::vector m_layers{}; + + CPL_DISALLOW_COPY_ASSIGN(GDALVectorPipelineReadOutputDataset) + + public: + explicit GDALVectorPipelineReadOutputDataset(GDALDataset &oSrcDS); + + void AddLayer(OGRLayer &oSrcLayer); + + int GetLayerCount() override; + + OGRLayer *GetLayer(int idx) override; + + int TestCapability(const char *pszCap) override; + + void ResetReading() override; + + OGRFeature *GetNextFeature(OGRLayer **ppoBelongingLayer, + double *pdfProgressPct, + GDALProgressFunc pfnProgress, + void *pProgressData) override; +}; + +/************************************************************************/ +/* GDALVectorPipelineReadOutputDataset() */ +/************************************************************************/ + +GDALVectorPipelineReadOutputDataset::GDALVectorPipelineReadOutputDataset( + GDALDataset &srcDS) + : m_srcDS(srcDS) +{ + SetDescription(m_srcDS.GetDescription()); +} + +/************************************************************************/ +/* GDALVectorPipelineReadOutputDataset::AddLayer() */ +/************************************************************************/ + +void GDALVectorPipelineReadOutputDataset::AddLayer(OGRLayer &oSrcLayer) +{ + m_layers.push_back(&oSrcLayer); +} + +/************************************************************************/ +/* GDALVectorPipelineReadOutputDataset::GetLayerCount() */ +/************************************************************************/ + +int GDALVectorPipelineReadOutputDataset::GetLayerCount() +{ + return static_cast(m_layers.size()); +} + +/************************************************************************/ +/* GDALVectorPipelineReadOutputDataset::GetLayer() */ +/************************************************************************/ + +OGRLayer *GDALVectorPipelineReadOutputDataset::GetLayer(int idx) +{ + return idx >= 0 && idx < GetLayerCount() ? m_layers[idx] : nullptr; +} + +/************************************************************************/ +/* GDALVectorPipelineReadOutputDataset::TestCapability() */ +/************************************************************************/ + +int GDALVectorPipelineReadOutputDataset::TestCapability(const char *pszCap) +{ + if (EQUAL(pszCap, ODsCRandomLayerRead)) + return m_srcDS.TestCapability(pszCap); + return false; +} + +/************************************************************************/ +/* GDALVectorPipelineReadOutputDataset::ResetReading() */ +/************************************************************************/ + +void GDALVectorPipelineReadOutputDataset::ResetReading() +{ + m_srcDS.ResetReading(); +} + +/************************************************************************/ +/* GDALVectorPipelineReadOutputDataset::GetNextFeature() */ +/************************************************************************/ + +OGRFeature *GDALVectorPipelineReadOutputDataset::GetNextFeature( + OGRLayer **ppoBelongingLayer, double *pdfProgressPct, + GDALProgressFunc pfnProgress, void *pProgressData) +{ + while (true) + { + OGRLayer *poBelongingLayer = nullptr; + auto poFeature = std::unique_ptr(m_srcDS.GetNextFeature( + &poBelongingLayer, pdfProgressPct, pfnProgress, pProgressData)); + if (ppoBelongingLayer) + *ppoBelongingLayer = poBelongingLayer; + if (!poFeature) + break; + if (std::find(m_layers.begin(), m_layers.end(), poBelongingLayer) != + m_layers.end()) + return poFeature.release(); + } + return nullptr; +} + /************************************************************************/ /* GDALVectorReadAlgorithm::RunStep() */ /************************************************************************/ @@ -49,8 +164,8 @@ bool GDALVectorReadAlgorithm::RunStep(GDALProgressFunc, void *) else { auto poSrcDS = m_inputDataset.GetDatasetRef(); - auto poOutDS = std::make_unique(); - poOutDS->SetDescription(poSrcDS->GetDescription()); + auto poOutDS = + std::make_unique(*poSrcDS); for (const auto &srcLayerName : m_inputLayerNames) { auto poSrcLayer = poSrcDS->GetLayerByName(srcLayerName.c_str()); @@ -61,7 +176,7 @@ bool GDALVectorReadAlgorithm::RunStep(GDALProgressFunc, void *) srcLayerName.c_str()); return false; } - poOutDS->AddLayer(poSrcLayer); + poOutDS->AddLayer(*poSrcLayer); } m_outputDataset.Set(std::move(poOutDS)); } diff --git a/apps/gdalalg_vector_reproject.cpp b/apps/gdalalg_vector_reproject.cpp index fccacbbe1f4b..5d23df2df4ad 100644 --- a/apps/gdalalg_vector_reproject.cpp +++ b/apps/gdalalg_vector_reproject.cpp @@ -65,8 +65,7 @@ bool GDALVectorReprojectAlgorithm::RunStep(GDALProgressFunc, void *) auto poSrcDS = m_inputDataset.GetDatasetRef(); auto reprojectedDataset = - std::make_unique(); - reprojectedDataset->SetDescription(poSrcDS->GetDescription()); + std::make_unique(*poSrcDS); const int nLayerCount = poSrcDS->GetLayerCount(); bool ret = true; @@ -95,10 +94,11 @@ bool GDALVectorReprojectAlgorithm::RunStep(GDALProgressFunc, void *) ret = (poCT != nullptr) && (poReversedCT != nullptr); if (ret) { - reprojectedDataset->AddLayer(std::make_unique( - poSrcLayer, /* iGeomField = */ 0, - /*bTakeOwnership = */ false, poCT.release(), - poReversedCT.release())); + reprojectedDataset->AddLayer( + *poSrcLayer, std::make_unique( + poSrcLayer, /* iGeomField = */ 0, + /*bTakeOwnership = */ false, + poCT.release(), poReversedCT.release())); } } } diff --git a/apps/gdalalg_vector_select.cpp b/apps/gdalalg_vector_select.cpp index 28c10de25f6e..b7a29b0599a8 100644 --- a/apps/gdalalg_vector_select.cpp +++ b/apps/gdalalg_vector_select.cpp @@ -51,7 +51,7 @@ namespace /************************************************************************/ class GDALVectorSelectAlgorithmLayer final - : public OGRLayer, + : public OGRLayerWithTranslateFeature, public OGRGetNextFeatureThroughRaw { private: @@ -257,6 +257,13 @@ class GDALVectorSelectAlgorithmLayer final m_oSrcLayer.ResetReading(); } + void TranslateFeature( + std::unique_ptr poSrcFeature, + std::vector> &apoOutFeatures) override + { + apoOutFeatures.push_back(TranslateFeature(poSrcFeature.release())); + } + OGRFeature *GetNextRawFeature() { auto poSrcFeature = @@ -304,8 +311,7 @@ bool GDALVectorSelectAlgorithm::RunStep(GDALProgressFunc, void *) auto poSrcDS = m_inputDataset.GetDatasetRef(); - auto outDS = std::make_unique(); - outDS->SetDescription(poSrcDS->GetDescription()); + auto outDS = std::make_unique(*poSrcDS); for (auto &&poSrcLayer : poSrcDS->GetLayers()) { @@ -320,7 +326,7 @@ bool GDALVectorSelectAlgorithm::RunStep(GDALProgressFunc, void *) if (!poLayer->IncludeFields(m_fields, !m_ignoreMissingFields)) return false; } - outDS->AddLayer(std::move(poLayer)); + outDS->AddLayer(*poSrcLayer, std::move(poLayer)); } m_outputDataset.Set(std::move(outDS)); diff --git a/apps/gdalalg_vector_write.cpp b/apps/gdalalg_vector_write.cpp index 3d80845862a7..7e92faaad5cd 100644 --- a/apps/gdalalg_vector_write.cpp +++ b/apps/gdalalg_vector_write.cpp @@ -43,6 +43,12 @@ bool GDALVectorWriteAlgorithm::RunStep(GDALProgressFunc pfnProgress, { CPLAssert(m_inputDataset.GetDatasetRef()); + if (m_format == "stream") + { + m_outputDataset.Set(m_inputDataset.GetDatasetRef()); + return true; + } + CPLStringList aosOptions; aosOptions.AddString("--invoked-from-gdal-vector-convert"); if (!m_overwrite) diff --git a/autotest/utilities/test_gdalalg_vector_clip.py b/autotest/utilities/test_gdalalg_vector_clip.py index 0ec6a9fea798..b0f5891adb14 100755 --- a/autotest/utilities/test_gdalalg_vector_clip.py +++ b/autotest/utilities/test_gdalalg_vector_clip.py @@ -920,3 +920,37 @@ def test_gdalalg_vector_clip_like_neither_raster_no_vector(): match="clip: Cannot get extent from clip dataset", ): clip.Run() + + +@pytest.mark.require_driver("OSM") +def test_gdalalg_vector_clip_dataset_getnextfeature(): + + clip = get_clip_alg() + src_ds = gdal.OpenEx("../ogr/data/osm/test.pbf") + clip["input"] = src_ds + clip["bbox"] = [-180, -90, 180, 90] + + assert clip.ParseCommandLineArguments( + ["--of", "stream", "--output", "streamed_output"] + ) + assert clip.Run() + + out_ds = clip["output"].GetDataset() + assert out_ds.TestCapability(ogr.ODsCRandomLayerRead) + + expected = [] + while True: + f, lyr = src_ds.GetNextFeature() + if not f: + break + expected.append((f, lyr)) + + got = [] + out_ds.ResetReading() + while True: + f, lyr = out_ds.GetNextFeature() + if not f: + break + got.append((f, lyr)) + + assert len(expected) == len(got) diff --git a/autotest/utilities/test_gdalalg_vector_pipeline.py b/autotest/utilities/test_gdalalg_vector_pipeline.py index db93707735f7..589f64946a0d 100755 --- a/autotest/utilities/test_gdalalg_vector_pipeline.py +++ b/autotest/utilities/test_gdalalg_vector_pipeline.py @@ -15,7 +15,7 @@ import pytest -from osgeo import gdal +from osgeo import gdal, ogr def get_pipeline_alg(): @@ -47,6 +47,85 @@ def my_progress(pct, msg, user_data): ) +@pytest.mark.require_driver("OSM") +def test_gdalalg_vector_pipeline_read_osm(): + + pipeline = get_pipeline_alg() + assert pipeline.ParseCommandLineArguments( + [ + "read", + "../ogr/data/osm/test.pbf", + "!", + "write", + "--of=stream", + "streamed_file", + ] + ) + assert pipeline.Run() + + out_ds = pipeline["output"].GetDataset() + assert out_ds.TestCapability(ogr.ODsCRandomLayerRead) + + expected = [] + src_ds = gdal.OpenEx("../ogr/data/osm/test.pbf") + while True: + f, _ = src_ds.GetNextFeature() + if not f: + break + expected.append(str(f)) + + got = [] + out_ds.ResetReading() + while True: + f, _ = out_ds.GetNextFeature() + if not f: + break + got.append(str(f)) + + assert expected == got + + +@pytest.mark.require_driver("OSM") +def test_gdalalg_vector_pipeline_read_osm_subset_of_layers(): + + pipeline = get_pipeline_alg() + assert pipeline.ParseCommandLineArguments( + [ + "read", + "../ogr/data/osm/test.pbf", + "--layer=points,multipolygons", + "!", + "write", + "--of=stream", + "streamed_file", + ] + ) + assert pipeline.Run() + + out_ds = pipeline["output"].GetDataset() + assert out_ds.TestCapability(ogr.ODsCRandomLayerRead) + + expected = [] + src_ds = gdal.OpenEx("../ogr/data/osm/test.pbf") + while True: + f, lyr = src_ds.GetNextFeature() + if not f: + break + if lyr.GetName() in ["points", "multipolygons"]: + expected.append(str(f)) + + got = [] + out_ds.ResetReading() + while True: + f, _ = out_ds.GetNextFeature() + if not f: + break + got.append(str(f)) + + assert len(expected) == len(got) + assert expected == got + + def test_gdalalg_vector_pipeline_pipeline_arg(tmp_vsimem): out_filename = str(tmp_vsimem / "out.shp") diff --git a/autotest/utilities/test_gdalalg_vector_reproject.py b/autotest/utilities/test_gdalalg_vector_reproject.py new file mode 100755 index 000000000000..d23faf35766d --- /dev/null +++ b/autotest/utilities/test_gdalalg_vector_reproject.py @@ -0,0 +1,57 @@ +#!/usr/bin/env pytest +# -*- coding: utf-8 -*- +############################################################################### +# Project: GDAL/OGR Test Suite +# Purpose: 'gdal vector reproject' testing +# Author: Even Rouault +# +############################################################################### +# Copyright (c) 2025, Even Rouault +# +# SPDX-License-Identifier: MIT +############################################################################### + +import pytest + +from osgeo import gdal, ogr + + +def get_reproject_alg(): + return gdal.GetGlobalAlgorithmRegistry()["vector"]["reproject"] + + +# Most of the testing is done in test_gdalalg_vector_pipeline.py + + +@pytest.mark.require_driver("OSM") +def test_gdalalg_vector_reproject_dataset_getnextfeature(): + + alg = get_reproject_alg() + src_ds = gdal.OpenEx("../ogr/data/osm/test.pbf") + alg["input"] = src_ds + alg["dst-crs"] = "EPSG:4326" + + assert alg.ParseCommandLineArguments( + ["--of", "stream", "--output", "streamed_output"] + ) + assert alg.Run() + + out_ds = alg["output"].GetDataset() + assert out_ds.TestCapability(ogr.ODsCRandomLayerRead) + + expected = [] + while True: + f, _ = src_ds.GetNextFeature() + if not f: + break + expected.append(str(f)) + + got = [] + out_ds.ResetReading() + while True: + f, _ = out_ds.GetNextFeature() + if not f: + break + got.append(str(f)) + + assert expected == got diff --git a/ogr/ogrsf_frmts/generic/CMakeLists.txt b/ogr/ogrsf_frmts/generic/CMakeLists.txt index a3ebb6142954..20b64b9cf844 100644 --- a/ogr/ogrsf_frmts/generic/CMakeLists.txt +++ b/ogr/ogrsf_frmts/generic/CMakeLists.txt @@ -37,6 +37,7 @@ add_library( ogrunionlayer.cpp ogrlayerpool.cpp ogrlayerdecorator.cpp + ogrlayerwithtranslatefeature.cpp ogreditablelayer.cpp ogrmutexeddatasource.cpp ogrmutexedlayer.cpp diff --git a/ogr/ogrsf_frmts/generic/ogrlayerdecorator.h b/ogr/ogrsf_frmts/generic/ogrlayerdecorator.h index cc56d4584490..4b619ed6d8f9 100644 --- a/ogr/ogrsf_frmts/generic/ogrlayerdecorator.h +++ b/ogr/ogrsf_frmts/generic/ogrlayerdecorator.h @@ -17,7 +17,7 @@ #include "ogrsf_frmts.h" -class CPL_DLL OGRLayerDecorator : public OGRLayer +class CPL_DLL OGRLayerDecorator : virtual public OGRLayer { CPL_DISALLOW_COPY_ASSIGN(OGRLayerDecorator) diff --git a/ogr/ogrsf_frmts/generic/ogrlayerwithtranslatefeature.cpp b/ogr/ogrsf_frmts/generic/ogrlayerwithtranslatefeature.cpp new file mode 100644 index 000000000000..2bfaf1a66e83 --- /dev/null +++ b/ogr/ogrsf_frmts/generic/ogrlayerwithtranslatefeature.cpp @@ -0,0 +1,19 @@ +/****************************************************************************** + * + * Project: OpenGIS Simple Features Reference Implementation + * Purpose: Defines OGRLayerWithTranslateFeature class + * Author: Even Rouault, even dot rouault at spatialys.com + * + ****************************************************************************** + * Copyright (c) 2025, Even Rouault + * + * SPDX-License-Identifier: MIT + ****************************************************************************/ + +#include "ogrlayerwithtranslatefeature.h" + +#ifndef DOXYGEN_SKIP + +OGRLayerWithTranslateFeature::~OGRLayerWithTranslateFeature() = default; + +#endif diff --git a/ogr/ogrsf_frmts/generic/ogrlayerwithtranslatefeature.h b/ogr/ogrsf_frmts/generic/ogrlayerwithtranslatefeature.h new file mode 100644 index 000000000000..355b3774b279 --- /dev/null +++ b/ogr/ogrsf_frmts/generic/ogrlayerwithtranslatefeature.h @@ -0,0 +1,36 @@ +/****************************************************************************** + * + * Project: OpenGIS Simple Features Reference Implementation + * Purpose: Defines OGRLayerWithTranslateFeature class + * Author: Even Rouault, even dot rouault at spatialys.com + * + ****************************************************************************** + * Copyright (c) 2025, Even Rouault + * + * SPDX-License-Identifier: MIT + ****************************************************************************/ + +#ifndef OGRLAYERWITHTRANSLATEFEATURE_H_INCLUDED +#define OGRLAYERWITHTRANSLATEFEATURE_H_INCLUDED + +#ifndef DOXYGEN_SKIP + +#include "ogrsf_frmts.h" + +/** Class that just extends by OGRLayer by mandating a pure virtual method + * TranslateFeature() to be implemented. + */ +class OGRLayerWithTranslateFeature /* non final */ : virtual public OGRLayer +{ + public: + virtual ~OGRLayerWithTranslateFeature(); + + /** Translate the source feature into one or several output features */ + virtual void TranslateFeature( + std::unique_ptr poSrcFeature, + std::vector> &apoOutFeatures) = 0; +}; + +#endif /* DOXYGEN_SKIP */ + +#endif /* OGRLAYERWITHTRANSLATEFEATURE_H_INCLUDED */ diff --git a/ogr/ogrsf_frmts/generic/ogrmutexeddatasource.cpp b/ogr/ogrsf_frmts/generic/ogrmutexeddatasource.cpp index 1d1cf3484f87..0aa84ef6f6be 100644 --- a/ogr/ogrsf_frmts/generic/ogrmutexeddatasource.cpp +++ b/ogr/ogrsf_frmts/generic/ogrmutexeddatasource.cpp @@ -160,7 +160,7 @@ void OGRMutexedDataSource::ReleaseResultSet(OGRLayer *poResultsSet) { std::map::iterator oIter = m_oReverseMapLayers.find( - cpl::down_cast(poResultsSet)); + dynamic_cast(poResultsSet)); CPLAssert(oIter != m_oReverseMapLayers.end()); delete poResultsSet; poResultsSet = oIter->second; diff --git a/ogr/ogrsf_frmts/generic/ogrwarpedlayer.cpp b/ogr/ogrsf_frmts/generic/ogrwarpedlayer.cpp index a69205500e82..28b7ed486162 100644 --- a/ogr/ogrsf_frmts/generic/ogrwarpedlayer.cpp +++ b/ogr/ogrsf_frmts/generic/ogrwarpedlayer.cpp @@ -101,6 +101,18 @@ OGRErr OGRWarpedLayer::ISetSpatialFilter(int iGeomField, } } +/************************************************************************/ +/* TranslateFeature() */ +/************************************************************************/ + +void OGRWarpedLayer::TranslateFeature( + std::unique_ptr poSrcFeature, + std::vector> &apoOutFeatures) +{ + apoOutFeatures.push_back( + SrcFeatureToWarpedFeature(std::move(poSrcFeature))); +} + /************************************************************************/ /* SrcFeatureToWarpedFeature() */ /************************************************************************/ diff --git a/ogr/ogrsf_frmts/generic/ogrwarpedlayer.h b/ogr/ogrsf_frmts/generic/ogrwarpedlayer.h index 468f7e138f11..f5fd6a634eb4 100644 --- a/ogr/ogrsf_frmts/generic/ogrwarpedlayer.h +++ b/ogr/ogrsf_frmts/generic/ogrwarpedlayer.h @@ -16,13 +16,22 @@ #ifndef DOXYGEN_SKIP #include "ogrlayerdecorator.h" +#include "ogrlayerwithtranslatefeature.h" + #include +#if defined(_MSC_VER) +#pragma warning(push) +// Silence warnings of the type warning C4250: 'OGRWarpedLayer': inherits 'OGRLayerDecorator::OGRLayerDecorator::GetMetadata' via dominance +#pragma warning(disable : 4250) +#endif + /************************************************************************/ /* OGRWarpedLayer */ /************************************************************************/ -class CPL_DLL OGRWarpedLayer : public OGRLayerDecorator +class CPL_DLL OGRWarpedLayer : public OGRLayerDecorator, + public OGRLayerWithTranslateFeature { CPL_DISALLOW_COPY_ASSIGN(OGRWarpedLayer) @@ -53,6 +62,10 @@ class CPL_DLL OGRWarpedLayer : public OGRLayerDecorator poReversedCT /* may be NULL, ownership acquired by OGRWarpedLayer */); virtual ~OGRWarpedLayer(); + void TranslateFeature( + std::unique_ptr poSrcFeature, + std::vector> &apoOutFeatures) override; + void SetExtent(double dfXMin, double dfYMin, double dfXMax, double dfYMax); virtual OGRErr ISetSpatialFilter(int iGeomField, @@ -83,6 +96,10 @@ class CPL_DLL OGRWarpedLayer : public OGRLayerDecorator CSLConstList papszOptions = nullptr) override; }; +#if defined(_MSC_VER) +#pragma warning(pop) +#endif + #endif /* #ifndef DOXYGEN_SKIP */ #endif // OGRWARPEDLAYER_H_INCLUDED From ca3cb8c2bf3a8f97e8fae9153a36bb268559a9bc Mon Sep 17 00:00:00 2001 From: Even Rouault Date: Tue, 18 Feb 2025 18:39:21 +0100 Subject: [PATCH 8/9] Doc: add Gulf of Mexico nickname --- NEWS.md | 2 +- doc/source/about_no_title.rst | 2 +- doc/source/download.rst | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/NEWS.md b/NEWS.md index a0427eecb781..a976003c5cb1 100644 --- a/NEWS.md +++ b/NEWS.md @@ -360,7 +360,7 @@ XODR driver: * Fix typo in handling of Translate widthPct, heightPct * add relatedFieldNameMatch parameter to gdal.VectorTranslate() -# GDAL/OGR 3.10.2 Release Notes +# GDAL/OGR 3.10.2 "Gulf of Mexico" Release Notes GDAL 3.10.2 is a bugfix release. diff --git a/doc/source/about_no_title.rst b/doc/source/about_no_title.rst index 0c967d4b28ad..ccb02739c95e 100644 --- a/doc/source/about_no_title.rst +++ b/doc/source/about_no_title.rst @@ -1,4 +1,4 @@ -GDAL is a translator library for raster and vector geospatial data formats that is released under an MIT style Open Source :ref:`license` by the `Open Source Geospatial Foundation`_. As a library, it presents a single raster abstract data model and single vector abstract data model to the calling application for all supported formats. It also comes with a variety of useful command line utilities for data translation and processing. The `NEWS`_ page describes the February 2025 GDAL/OGR 3.10.2 release. +GDAL is a translator library for raster and vector geospatial data formats that is released under an MIT style Open Source :ref:`license` by the `Open Source Geospatial Foundation`_. As a library, it presents a single raster abstract data model and single vector abstract data model to the calling application for all supported formats. It also comes with a variety of useful command line utilities for data translation and processing. The `NEWS`_ page describes the February 2025 GDAL/OGR 3.10.2 "Gulf Of Mexico" release. .. only:: html diff --git a/doc/source/download.rst b/doc/source/download.rst index d11a13e7645a..c181361129a2 100644 --- a/doc/source/download.rst +++ b/doc/source/download.rst @@ -18,7 +18,7 @@ Source Code Current Release ............... -* **2025-02-14** `gdal-3.10.2.tar.gz`_ `3.10.2 Release Notes`_ (`3.10.2 md5`_) +* **2025-02-14** `gdal-3.10.2.tar.gz`_ `3.10.2 "Gulf of Mexico" Release Notes`_ (`3.10.2 md5`_) .. _`3.10.2 Release Notes`: https://github.com/OSGeo/gdal/blob/v3.10.2/NEWS.md .. _`gdal-3.10.2.tar.gz`: https://github.com/OSGeo/gdal/releases/download/v3.10.2/gdal-3.10.2.tar.gz From 3e34cfe067fd6a9d593f4760e8cdf67524bb181f Mon Sep 17 00:00:00 2001 From: Even Rouault Date: Tue, 18 Feb 2025 19:35:30 +0100 Subject: [PATCH 9/9] Fix doc building --- doc/source/download.rst | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/doc/source/download.rst b/doc/source/download.rst index c181361129a2..f39f7091c056 100644 --- a/doc/source/download.rst +++ b/doc/source/download.rst @@ -20,7 +20,7 @@ Current Release * **2025-02-14** `gdal-3.10.2.tar.gz`_ `3.10.2 "Gulf of Mexico" Release Notes`_ (`3.10.2 md5`_) -.. _`3.10.2 Release Notes`: https://github.com/OSGeo/gdal/blob/v3.10.2/NEWS.md +.. _`3.10.2 "Gulf of Mexico" Release Notes`: https://github.com/OSGeo/gdal/blob/v3.10.2/NEWS.md .. _`gdal-3.10.2.tar.gz`: https://github.com/OSGeo/gdal/releases/download/v3.10.2/gdal-3.10.2.tar.gz .. _`3.10.2 md5`: https://github.com/OSGeo/gdal/releases/download/v3.10.2/gdal-3.10.2.tar.gz.md5