forked from amazingfate/loongoffice
dependency for XLOOKUP and XMATCH because of better compatibility. The idea is to specify that the global setting 'search-criteria-must-apply-to-whole-cell' is ignored, and that XMATCH and XLOOKUP always behave as if 'search-criteria-must-apply-to-whole-cell'=true. That would affect exact search in Match_mode value 0. Users would need to use a wildcard or regex to match part of the content. But removing the dependency on the global setting increases interoperability with MS Excel. The ODF TC will also follow that in the final specification of these functions: https://issues.oasis-open.org/browse/OFFICE-4154 Follow-up commit: 17d578ba91f9c78a0e41d19b58183d2214c0b7a4 (Related: tdf#127293 Add new Match_mode option for XLOOKUP and XMATCH functions.) Change-Id: I1317865631d2925eaff72e9c1425d93386c3d016 Reviewed-on: https://gerrit.libreoffice.org/c/core/+/169582 Reviewed-by: Balazs Varga <balazs.varga.extern@allotropia.de> Reviewed-by: Regina Henschel <rb.henschel@t-online.de> Tested-by: Jenkins
277 lines
11 KiB
C++
277 lines
11 KiB
C++
/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
|
|
/*
|
|
* This file is part of the LibreOffice project.
|
|
*
|
|
* This Source Code Form is subject to the terms of the Mozilla Public
|
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
*
|
|
* This file incorporates work covered by the following license notice:
|
|
*
|
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
|
* contributor license agreements. See the NOTICE file distributed
|
|
* with this work for additional information regarding copyright
|
|
* ownership. The ASF licenses this file to you under the Apache
|
|
* License, Version 2.0 (the "License"); you may not use this file
|
|
* except in compliance with the License. You may obtain a copy of
|
|
* the License at http://www.apache.org/licenses/LICENSE-2.0 .
|
|
*/
|
|
|
|
#include <rangecache.hxx>
|
|
#include <cellvalue.hxx>
|
|
#include <document.hxx>
|
|
#include <brdcst.hxx>
|
|
#include <queryevaluator.hxx>
|
|
#include <queryparam.hxx>
|
|
|
|
#include <sal/log.hxx>
|
|
#include <svl/numformat.hxx>
|
|
#include <unotools/collatorwrapper.hxx>
|
|
|
|
/// Tells whether the sorted indices have to be stored in reverse (descending)
/// order for the query operator @p op.
///
/// Only the ordering operators and SC_EQUAL are accepted (asserted).
/// Returns true for SC_GREATER and SC_GREATER_EQUAL, false otherwise.
static bool needsDescending(ScQueryOp op)
{
    assert(op == SC_GREATER || op == SC_GREATER_EQUAL || op == SC_LESS || op == SC_LESS_EQUAL
           || op == SC_EQUAL);
    // The cached data is scanned from its beginning up to the last match, so
    // the matching values must come first. For the "greater" operators that
    // means the order has to be flipped.
    if (op == SC_GREATER)
        return true;
    return op == SC_GREATER_EQUAL;
}
|
|
|
|
/// Derives the kind of values a cache holds from the query parameters.
///
/// The query must consist of exactly one active entry with exactly one item,
/// and that item must be queried either by value or by string (asserted).
/// A by-value item yields ValueType::Values; a by-string item yields the
/// case-sensitive or case-insensitive string type depending on param.bCaseSens.
static ScSortedRangeCache::ValueType toValueType(const ScQueryParam& param)
{
    assert(param.GetEntry(0).bDoQuery && !param.GetEntry(1).bDoQuery
           && param.GetEntry(0).GetQueryItems().size() == 1);
    const auto eItemType = param.GetEntry(0).GetQueryItem().meType;
    assert(eItemType == ScQueryEntry::ByString || eItemType == ScQueryEntry::ByValue);

    if (eItemType != ScQueryEntry::ByValue)
    {
        // String query: the only remaining distinction is case sensitivity.
        if (param.bCaseSens)
            return ScSortedRangeCache::ValueType::StringsCaseSensitive;
        return ScSortedRangeCache::ValueType::StringsCaseInsensitive;
    }
    return ScSortedRangeCache::ValueType::Values;
}
|
|
|
|
/// Builds the sorted index of a single-column or single-row range.
///
/// @param pDoc                 document the range belongs to
/// @param rRange               range to cache; one column when param.bByRow is
///                             set, one row otherwise, always on one sheet (asserted)
/// @param param                query with exactly one active entry holding one item
/// @param context              interpreter context, used for number parsing and
///                             passed on to ScQueryEvaluator
/// @param invalid              if true the cache is left empty and mValid stays false
/// @param bNewSearchFunction   passed on to ScQueryEvaluator; when set, the
///                             whole-cell-match check on string cells is skipped
/// @param nSortedBinarySearch  0x00: the data is sorted here; 0x01: the data is
///                             taken as already ascending; any other value: the
///                             data is taken as already descending and is reversed
///
/// mValid is set to true only if the whole construction runs to the end.
ScSortedRangeCache::ScSortedRangeCache(ScDocument* pDoc, const ScRange& rRange,
                                       const ScQueryParam& param, ScInterpreterContext* context,
                                       bool invalid, bool bNewSearchFunction,
                                       sal_uInt8 nSortedBinarySearch)
    : maRange(rRange)
    , mpDoc(pDoc)
    , mValid(false)
    , mRowSearch(param.bByRow)
    , mValueType(toValueType(param))
{
    // Sanity checks on the shape of the range.
    if (mRowSearch)
        assert(maRange.aStart.Col() == maRange.aEnd.Col());
    else
        assert(maRange.aStart.Row() == maRange.aEnd.Row());
    assert(maRange.aStart.Tab() == maRange.aEnd.Tab());
    SCTAB nSheet = maRange.aStart.Tab();
    assert(param.GetEntry(0).bDoQuery && !param.GetEntry(1).bDoQuery
           && param.GetEntry(0).GetQueryItems().size() == 1);
    const ScQueryEntry& rEntry = param.GetEntry(0);
    const ScQueryEntry::Item& rItem = rEntry.GetQueryItem();
    mQueryOp = rEntry.eOp;
    mQueryType = rItem.meType;

    if (invalid)
        return; // nothing to collect, the cache stays empty

    SCROW nFirstRow = maRange.aStart.Row();
    SCROW nLastRow = maRange.aEnd.Row();
    SCCOL nFirstCol = maRange.aStart.Col();
    SCCOL nLastCol = maRange.aEnd.Col();
    // Unless empty cells may match, restrict the scan to the data area.
    if (!rItem.mbMatchEmpty
        && !pDoc->ShrinkToDataArea(nSheet, nFirstCol, nFirstRow, nLastCol, nLastRow))
        return; // no data cells at all, a cache would be pointless

    // Copies the col/row indices of the (already ordered) data into
    // mSortedRows or mSortedCols, back to front if the operator requires it.
    const auto publishOrder = [this, &rEntry](const auto& rOrdered) {
        const auto storeIndex = [this](SCCOLROW nColRow) {
            if (mRowSearch)
                mSortedRows.emplace_back(nColRow);
            else
                mSortedCols.emplace_back(nColRow);
        };
        if (needsDescending(rEntry.eOp))
        {
            for (auto itRev = rOrdered.rbegin(); itRev != rOrdered.rend(); ++itRev)
                storeIndex(itRev->col_row);
        }
        else
        {
            for (const auto& rElem : rOrdered)
                storeIndex(rElem.col_row);
        }
    };

    if (mValueType == ValueType::Values)
    {
        struct ColRowData
        {
            SCCOLROW col_row;
            double value;
        };

        std::vector<ColRowData> aNumbers;
        for (SCCOL nCol = nFirstCol; nCol <= nLastCol; ++nCol)
        {
            for (SCROW nRow = nFirstRow; nRow <= nLastRow; ++nRow)
            {
                ScRefCellValue aCell(pDoc->GetRefCellValue(ScAddress(nCol, nRow, nSheet)));
                if (ScQueryEvaluator::isQueryByValue(mQueryOp, mQueryType, aCell))
                {
                    aNumbers.push_back(ColRowData{ mRowSearch ? nRow : nCol, aCell.getValue() });
                    continue;
                }
                if (!ScQueryEvaluator::isQueryByString(mQueryOp, mQueryType, aCell))
                    continue;

                // The generic handling in ScQueryEvaluator::processEntry() has more
                // cases than the numeric one, and they must not change the outcome.
                // (ByTextColor/ByBackgroundColor are blocked by CanBeUsedForSorterCache(),
                // but isQueryByString() is possible if the cell content is a string.)
                // Mixing strings into the numeric data would be tricky, since a string
                // comparison may possibly(?) differ from a numeric one. So test whether
                // the text could match a number at all by converting it. Text that
                // cannot be converted is safe to skip (e.g. a textual header when the
                // query covers the whole column). Text that can be converted means
                // giving up and leaving the query to the unoptimized code.
                // TODO Maybe it would actually work to use the numeric value obtained here?
                if (!bNewSearchFunction && !ScQueryEvaluator::isMatchWholeCell(*pDoc, mQueryOp))
                    return; // substring matching cannot be sorted, but new search functions are sorted
                sal_uInt32 nFormat = 0;
                double fParsed;
                if (context->NFIsNumberFormat(aCell.getString(pDoc), nFormat, fParsed))
                    return;
            }
        }

        switch (nSortedBinarySearch)
        {
            case 0x00: // nBinarySearchDisabled: establish ascending order here
                std::stable_sort(aNumbers.begin(), aNumbers.end(),
                                 [](const ColRowData& rLhs, const ColRowData& rRhs) {
                                     return rLhs.value < rRhs.value;
                                 });
                break;
            case 0x01: // nSearchbAscd: expected to be sorted ascending already
                break;
            default: // 0x02, nSearchbDesc: expected to be sorted descending, just flip it
                std::reverse(aNumbers.begin(), aNumbers.end());
                break;
        }

        publishOrder(aNumbers);
    }
    else
    {
        struct ColRowData
        {
            SCCOLROW col_row;
            OUString string;
        };
        std::vector<ColRowData> aTexts;
        // Lean on ScQueryEvaluator as far as possible, so that the strings
        // compared here are the ones the regular query would compare.
        assert(pDoc->FetchTable(nSheet) != nullptr);
        ScQueryEvaluator aEvaluator(*pDoc, *pDoc->FetchTable(nSheet), param, context, nullptr,
                                    bNewSearchFunction);
        for (SCCOL nCol = nFirstCol; nCol <= nLastCol; ++nCol)
        {
            for (SCROW nRow = nFirstRow; nRow <= nLastRow; ++nRow)
            {
                ScRefCellValue aCell(pDoc->GetRefCellValue(ScAddress(nCol, nRow, nSheet)));
                // This branch is meant for ScQueryEntry::ByString only, so
                // ScQueryEvaluator::isQueryByString() should be the sole case of the
                // generic handling in ScQueryEvaluator::processEntry() that applies
                // (ByTextColor/ByBackgroundColor are blocked by CanBeUsedForSorterCache(),
                // and isQueryByValue() is blocked by ScQueryEntry::ByString).
                assert(mQueryType == ScQueryEntry::ByString);
                assert(!ScQueryEvaluator::isQueryByValue(mQueryOp, mQueryType, aCell));
                if (ScQueryEvaluator::isQueryByString(mQueryOp, mQueryType, aCell))
                {
                    const svl::SharedString* pShared = nullptr;
                    OUString aText = aEvaluator.getCellString(aCell, nRow, nCol, &pShared);
                    // If a shared string was handed back, its text is the one to use.
                    if (pShared)
                        aText = pShared->getString();
                    aTexts.push_back(ColRowData{ mRowSearch ? nRow : nCol, aText });
                }
            }
        }
        CollatorWrapper& rCollator
            = ScGlobal::GetCollator(mValueType == ValueType::StringsCaseSensitive);

        switch (nSortedBinarySearch)
        {
            case 0x00: // nBinarySearchDisabled: establish ascending order here
                std::stable_sort(aTexts.begin(), aTexts.end(),
                                 [&rCollator](const ColRowData& rLhs, const ColRowData& rRhs) {
                                     return rCollator.compareString(rLhs.string, rRhs.string) < 0;
                                 });
                break;
            case 0x01: // nSearchbAscd: expected to be sorted ascending already
                break;
            default: // 0x02, nSearchbDesc: expected to be sorted descending, just flip it
                std::reverse(aTexts.begin(), aTexts.end());
                break;
        }

        publishOrder(aTexts);
    }

    // Build the reverse mapping from position within the original range to
    // position in the sorted list. Entries that are not part of the sorted
    // list keep the max_size() filler value.
    if (mRowSearch)
    {
        mRowToIndex.resize(maRange.aEnd.Row() - maRange.aStart.Row() + 1, mSortedRows.max_size());
        for (size_t nPos = 0; nPos < mSortedRows.size(); ++nPos)
            mRowToIndex[mSortedRows[nPos] - maRange.aStart.Row()] = nPos;
    }
    else
    {
        mColToIndex.resize(maRange.aEnd.Col() - maRange.aStart.Col() + 1, mSortedCols.max_size());
        for (size_t nPos = 0; nPos < mSortedCols.size(); ++nPos)
            mColToIndex[mSortedCols[nPos] - maRange.aStart.Col()] = nPos;
    }
    mValid = true;
}
|
|
|
|
void ScSortedRangeCache::Notify(const SfxHint& rHint)
|
|
{
|
|
if (!mpDoc->IsInDtorClear())
|
|
{
|
|
if (rHint.GetId() == SfxHintId::ScDataChanged || rHint.GetId() == SfxHintId::ScAreaChanged)
|
|
{
|
|
mpDoc->RemoveSortedRangeCache(*this);
|
|
// this ScSortedRangeCache is deleted by RemoveSortedRangeCache
|
|
}
|
|
}
|
|
}
|
|
|
|
/// Assembles the key identifying a cache for @p range and @p param: the
/// range, the value type derived from the query, the operator of the query's
/// first entry and the type of that entry's single item.
ScSortedRangeCache::HashKey ScSortedRangeCache::makeHashKey(const ScRange& range,
                                                            const ScQueryParam& param)
{
    // Only queries with one active entry holding one item are supported.
    assert(param.GetEntry(0).bDoQuery && !param.GetEntry(1).bDoQuery
           && param.GetEntry(0).GetQueryItems().size() == 1);
    const ScQueryEntry& rFirstEntry = param.GetEntry(0);
    const ScQueryEntry::Item& rOnlyItem = rFirstEntry.GetQueryItem();
    HashKey aKey{ range, toValueType(param), rFirstEntry.eOp, rOnlyItem.meType };
    return aKey;
}
|
|
|
|
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */
|