// SPDX-FileCopyrightText: 2020 Kitsune Ral // SPDX-License-Identifier: LGPL-2.1-or-later #include "uri.h" #include "logging.h" #include using namespace Quotient; struct ReplacePair { QByteArray uriString; char sigil; }; /// \brief Defines bi-directional mapping of path prefixes and sigils /// /// When there are two prefixes for the same sigil, the first matching /// entry for a given sigil is used. static const auto replacePairs = { ReplacePair { "u/", '@' }, { "user/", '@' }, { "roomid/", '!' }, { "r/", '#' }, { "room/", '#' }, // The notation for bare event ids is not proposed in MSC2312 but there's // https://github.com/matrix-org/matrix-doc/pull/2644 { "e/", '$' }, { "event/", '$' } }; Uri::Uri(QByteArray primaryId, QByteArray secondaryId, QString query) { if (primaryId.isEmpty()) primaryType_ = Empty; else { setScheme("matrix"); QString pathToBe; primaryType_ = Invalid; if (primaryId.size() < 2) // There should be something after sigil return; for (const auto& p: replacePairs) if (primaryId[0] == p.sigil) { primaryType_ = Type(p.sigil); auto safePrimaryId = primaryId.mid(1); safePrimaryId.replace('/', "%2F"); pathToBe = p.uriString + safePrimaryId; break; } if (!secondaryId.isEmpty()) { if (secondaryId.size() < 2) { primaryType_ = Invalid; return; } auto safeSecondaryId = secondaryId.mid(1); safeSecondaryId.replace('/', "%2F"); pathToBe += "/event/" + safeSecondaryId; } setPath(pathToBe, QUrl::TolerantMode); } if (!query.isEmpty()) setQuery(query); } static inline auto encodedPath(const QUrl& url) { return url.path(QUrl::EncodeDelimiters | QUrl::EncodeUnicode); } static QString pathSegment(const QUrl& url, int which) { return QUrl::fromPercentEncoding( encodedPath(url).section('/', which, which).toUtf8()); } static auto decodeFragmentPart(const QStringRef& part) { return QUrl::fromPercentEncoding(part.toLatin1()).toUtf8(); } static auto matrixToUrlRegexInit() { // See https://matrix.org/docs/spec/appendices#matrix-to-navigation const QRegularExpression MatrixToUrlRE { "^/(?
[^:]+:[^/?]+)(/(?(\\$|%24)[^?]+))?(\\?(?.+))?$" }; Q_ASSERT(MatrixToUrlRE.isValid()); return MatrixToUrlRE; } Uri::Uri(QUrl url) : QUrl(std::move(url)) { // NB: don't try to use `url` from here on, it's moved-from and empty if (isEmpty()) return; // primaryType_ == Empty primaryType_ = Invalid; if (!QUrl::isValid()) // MatrixUri::isValid() checks primaryType_ return; if (scheme() == "matrix") { // Check sanity as per https://github.com/matrix-org/matrix-doc/pull/2312 const auto& urlPath = encodedPath(*this); const auto& splitPath = urlPath.splitRef('/'); switch (splitPath.size()) { case 2: break; case 4: if (splitPath[2] == "event" || splitPath[2] == "e") break; [[fallthrough]]; default: return; // Invalid } for (const auto& p: replacePairs) if (urlPath.startsWith(p.uriString)) { primaryType_ = Type(p.sigil); return; // The only valid return path for matrix: URIs } qCDebug(MAIN) << "The matrix: URI is not recognised:" << toDisplayString(); return; } primaryType_ = NonMatrix; // Default, unless overridden by the code below if (scheme() == "https" && authority() == "matrix.to") { static const auto MatrixToUrlRE = matrixToUrlRegexInit(); // matrix.to accepts both literal sigils (as well as & and ? used in // its "query" substitute) and their %-encoded forms; // so force QUrl to decode everything. auto f = fragment(QUrl::EncodeUnicode); if (auto&& m = MatrixToUrlRE.match(f); m.hasMatch()) *this = Uri { decodeFragmentPart(m.capturedRef("main")), decodeFragmentPart(m.capturedRef("sec")), decodeFragmentPart(m.capturedRef("query")) }; } } Uri::Uri(const QString& uriOrId) : Uri(fromUserInput(uriOrId)) {} Uri Uri::fromUserInput(const QString& uriOrId) { if (uriOrId.isEmpty()) return {}; // type() == None // A quick check if uriOrId is a plain Matrix id // Bare event ids cannot be resolved without a room scope as per the current // spec but there's a movement towards making them navigable (see, e.g., // https://github.com/matrix-org/matrix-doc/pull/2644) - so treat them // as valid if (QStringLiteral("!@#+$").contains(uriOrId[0])) return Uri { uriOrId.toUtf8() }; return Uri { QUrl::fromUserInput(uriOrId) }; } Uri::Type Uri::type() const { return primaryType_; } Uri::SecondaryType Uri::secondaryType() const { const auto& type2 = pathSegment(*this, 2); return type2 == "event" || type2 == "e" ? EventId : NoSecondaryId; } QUrl Uri::toUrl(UriForm form) const { if (!isValid()) return {}; if (form == CanonicalUri || type() == NonMatrix) return *this; // NOLINT(cppcoreguidelines-slicing): It's intentional QUrl url; url.setScheme("https"); url.setHost("matrix.to"); url.setPath("/"); auto fragment = '/' + primaryId(); if (const auto& secId = secondaryId(); !secId.isEmpty()) fragment += '/' + secId; if (const auto& q = query(); !q.isEmpty()) fragment += '?' + q; url.setFragment(fragment); return url; } QString Uri::primaryId() const { if (primaryType_ == Empty || primaryType_ == Invalid) return {}; const auto& idStem = pathSegment(*this, 1); return idStem.isEmpty() ? idStem : primaryType_ + idStem; } QString Uri::secondaryId() const { const auto& idStem = pathSegment(*this, 3); return idStem.isEmpty() ? idStem : secondaryType() + idStem; } static const auto ActionKey = QStringLiteral("action"); QString Uri::action() const { return type() == NonMatrix || !isValid() ? QString() : QUrlQuery { query() }.queryItemValue(ActionKey); } void Uri::setAction(const QString& newAction) { if (!isValid()) { qCWarning(MAIN) << "Cannot set an action on an invalid Quotient::Uri"; return; } QUrlQuery q { query() }; q.removeQueryItem(ActionKey); q.addQueryItem(ActionKey, newAction); setQuery(q); } QStringList Uri::viaServers() const { return QUrlQuery { query() }.allQueryItemValues(QStringLiteral("via"), QUrl::EncodeReserved); } bool Uri::isValid() const { return primaryType_ != Empty && primaryType_ != Invalid; }