// Copyright 2019 The Chromium Authors // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #include #include #include "content/browser/sms/sms_parser.h" #include "base/strings/string_piece.h" #include "net/base/url_util.h" #include "third_party/abseil-cpp/absl/types/optional.h" #include "third_party/re2/src/re2/re2.h" #include "url/gurl.h" #include "url/origin.h" namespace content { namespace { // SMS one-time-passcode format: // https://wicg.github.io/sms-one-time-codes/#parsing constexpr char kOtpFormatRegex[] = "(?:^|\\s)" // Leading characters "@([a-zA-Z0-9.-]+) " // Domain "#([^#\\s]+)" // OTP "(?: @([a-zA-Z0-9.-]+))?"; // Optional domain using SmsParsingStatus = SmsParser::SmsParsingStatus; using ParseDomainResult = std::tuple; ParseDomainResult ParseDomain(const std::string& domain) { std::string host, scheme; int port; if (!net::ParseHostAndPort(domain, &host, &port)) return std::make_tuple(SmsParsingStatus::kHostAndPortNotParsed, GURL()); // Expect localhost to always be http. if (net::HostStringIsLocalhost(base::StringPiece(host))) { scheme = "http://"; } else { scheme = "https://"; } GURL gurl = GURL(scheme + domain); if (!gurl.is_valid()) return std::make_tuple(SmsParsingStatus::kGURLNotValid, GURL()); return std::make_tuple(SmsParsingStatus::kParsed, gurl); } } // namespace SmsParser::Result::Result(SmsParsingStatus status) : parsing_status(status) { DCHECK(parsing_status != SmsParsingStatus::kParsed); } SmsParser::Result::Result(const url::Origin& top_origin, const url::Origin& embedded_origin, const std::string& one_time_code) : top_origin(std::move(top_origin)), embedded_origin(std::move(embedded_origin)), one_time_code(one_time_code) { parsing_status = SmsParsingStatus::kParsed; } SmsParser::Result::Result(const Result& other) = default; SmsParser::Result::~Result() = default; OriginList SmsParser::Result::GetOriginList() const { DCHECK(IsValid()); OriginList origin_list; if (!embedded_origin.opaque()) origin_list.push_back(embedded_origin); origin_list.push_back(top_origin); return origin_list; } // static SmsParser::Result SmsParser::Parse(base::StringPiece sms) { std::string top_domain, otp, embedded_domain; // TODO(yigu): The existing kOtpFormatRegex may filter out invalid SMSes that // would fall into |kHostAndPortNotParsed| or |kGURLNotValid| below. We should // clean up the code if the statement is confirmed by metrics. if (!re2::RE2::PartialMatch(std::string(sms), kOtpFormatRegex, &top_domain, &otp, &embedded_domain)) return Result(SmsParsingStatus::kOTPFormatRegexNotMatch); auto [top_domain_parsing_status, top_gurl] = ParseDomain(top_domain); if (top_domain_parsing_status != SmsParsingStatus::kParsed) return Result(top_domain_parsing_status); DCHECK(top_gurl.is_valid()); url::Origin top_origin = url::Origin::Create(top_gurl); DCHECK(!top_origin.opaque()); if (embedded_domain == "") return Result(top_origin, url::Origin(), otp); auto [embedded_domain_parsing_status, embedded_gurl] = ParseDomain(embedded_domain); if (embedded_domain_parsing_status != SmsParsingStatus::kParsed) return Result(embedded_domain_parsing_status); DCHECK(embedded_gurl.is_valid()); url::Origin embedded_origin = url::Origin::Create(embedded_gurl); DCHECK(!embedded_origin.opaque()); return Result(top_origin, embedded_origin, otp); } } // namespace content