From 18dd4f9479ea443eaa34173ae2e7abbebfec3a82 Mon Sep 17 00:00:00 2001
From: Alexei Cazacov <alexei.cazacov@qt.io>
Date: Wed, 26 Feb 2025 14:56:48 +0200
Subject: [PATCH] Doc: Move 'Classes for string data' topic to Qt Core and add
 it to TOC

Fixes: QTBUG-133954
Change-Id: If51abefc39eaae29f7d533af2974017793ef9358
Reviewed-by: Matthias Rauter <matthias.rauter@qt.io>
(cherry picked from commit baeed8e1e75db988aa53aa56353aa9c1f821b542)
Reviewed-by: Qt Cherry-pick Bot <cherrypick_bot@qt-project.org>
---
 src/corelib/doc/images/string_class_api.svg   | 234 ++++++++++
 .../doc/images/string_class_calling.svg       | 266 ++++++++++++
 src/corelib/doc/src/qstring-overview.qdoc     | 410 ++++++++++++++++++
 src/corelib/doc/src/qtcore-toc.qdoc           |   3 +-
 4 files changed, 912 insertions(+), 1 deletion(-)
 create mode 100644 src/corelib/doc/images/string_class_api.svg
 create mode 100644 src/corelib/doc/images/string_class_calling.svg
 create mode 100644 src/corelib/doc/src/qstring-overview.qdoc
diff --git a/src/corelib/doc/images/string_class_api.svg b/src/corelib/doc/images/string_class_api.svg
new file mode 100644
index 00000000000..c46b40d1bf3
--- /dev/null
+++ b/src/corelib/doc/images/string_class_api.svg
@@ -0,0 +1,234 @@
+<?xml version="1.0" encoding="UTF-8" standalone="no"?>
+<svg
+  viewBox="-410 -30 540 440"
+  version="1.1"
+  xmlns="http://www.w3.org/2000/svg"
+  xmlns:svg="http://www.w3.org/2000/svg">
+  <defs>
+    <path id="raute"
+      fill="#cfe7f5"
+      stroke="black"
+      stroke-width="1px"
+      d="m 0 -40 L 80 0 L 0 40 L -80 0 z" />
+    <path id="lozenge"
+      fill="#cfe7f5"
+      stroke="black"
+      stroke-width="1px"
+      d="M -60,-20
+         h 120
+         a 20,20 0 0 1 20,20
+         v 0
+         a 20,20 0 0 1 -20,20
+         h -120
+         a 20,20 0 0 1 -20,-20
+         v 0
+         a 20,20 0 0 1 20,-20
+         Z"/>
+    <path id="lozenge_small"
+      fill="#cfe7f5"
+      stroke="black"
+      stroke-width="1px"
+      d="M -40,-20
+         h 80
+         a 20,20 0 0 1 20,20
+         v 0
+         a 20,20 0 0 1 -20,20
+         h -80
+         a 20,20 0 0 1 -20,-20
+         v 0
+         a 20,20 0 0 1 20,-20
+         Z"/>
+    <marker
+      id="triangle"
+      viewBox="0 0 10 10"
+      refX="1"
+      refY="5"
+      markerUnits="strokeWidth"
+      markerWidth="10"
+      markerHeight="10"
+      orient="auto">
+      <path d="M 0 0 L 10 5 L 0 10 z" fill="black" />
+    </marker>
+  </defs>
+
+  <g id="start" transform="translate(-160, 0)">
+    <use href="#lozenge_small" />
+    <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle"
+      transform="translate(0, -6)">
+      <tspan x="0" dy="0em">String class</tspan>
+      <tspan x="0" dy="1.2em">for creating API</tspan>
+    </text>
+  </g>
+
+  <g id="param_or_return" transform="translate(-160, 100)">
+   <use href="#raute" />
+   <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle"
+      transform="translate(0, -6)">
+      <tspan x="0" dy="0em">parameter or</tspan>
+      <tspan x="0" dy="1.2em">return value?</tspan>
+  </text>
+  </g>
+
+  <g id="make_copy" transform="translate(-320, 200)">
+    <use href="#raute" />
+    <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle"
+      transform="translate(0, -6)">
+      <tspan x="0" dy="0em">Will you make</tspan>
+      <tspan x="0" dy="1.2em">a persistent copy?</tspan>
+    </text>
+  </g>
+
+  <g id="ref_or_perm" transform="translate(40, 200)">
+    <use href="#raute" />
+     <text
+       font-size="12" fill="black"
+       text-anchor="middle" dominant-baseline="middle"
+       transform="translate(0, -12)">
+       <tspan x="0" dy="0em">Reference to</tspan>
+       <tspan x="0" dy="1.2em">permanent or</tspan>
+       <tspan x="0" dy="1.2em">temporary?</tspan>
+  </text>
+  </g>
+
+  <g id="full_or_part" transform="translate(-80, 300)"> <!-- decision node; id renamed so it is unique in this document -->
+    <use href="#raute" />
+    <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle"
+      transform="translate(0, -6)">
+      <tspan x="0" dy="0em">Reference to full</tspan>
+      <tspan x="0" dy="1.2em">or part?</tspan>
+    </text>
+  </g>
+
+  <g id="const_ref" transform="translate(-320, 300)">
+    <use href="#lozenge" />
+    <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle" >
+      <tspan x="0" dy="0em">const QString&amp;</tspan>
+    </text>
+  </g>
+
+  <g id="anystringview" transform="translate(-200, 380)">
+    <use href="#lozenge" />
+    <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle"
+      transform="translate(0, -8)" >
+      <tspan x="0" dy="0em">Q*StringView</tspan>
+      <tspan font-size="8" x="0" dy="1.4em">parameters preferably QAnyStringView</tspan>
+      <tspan font-size="8" x="0" dy="1.2em">or any of L1, UTF8, or UTF16</tspan>
+    </text>
+  </g>
+
+
+  <g id="qstring" transform="translate(40, 380)"> <!-- result node: QString; id renamed so it is unique in this document -->
+    <use href="#lozenge" />
+    <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle" >
+      <tspan x="0" dy="0em">QString</tspan>
+    </text>
+  </g>
+
+  <g transform="translate(-160, 20)">
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l 0 30" />
+  </g>
+
+  <g transform="translate(-240, 100)">
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l -80 0 l 0 50" />
+    <text x="-40" y="-5"
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="auto">
+      parameter
+    </text>
+  </g>
+
+  <g transform="translate(-80, 100)">
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l 120 0 l 0 50" />
+    <text x="60" y="-5"
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="auto">
+      return value
+    </text>
+  </g>
+
+  <g transform="translate(-320, 240)"> <!-- downward edge labelled "yes" -->
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l 0 30" />
+    <text x="5" y="15"
+      font-size="12" fill="black"
+      text-anchor="start" dominant-baseline="middle">
+      yes
+    </text>
+  </g>
+
+  <g transform="translate(-240, 200)">
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l 40 0 l 0 150" />
+    <text x="20" y="-5"
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="auto">
+      no
+    </text>
+  </g>
+
+  <g transform="translate(-40, 200)">
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l -40 0 l 0 50" />
+    <text x="-20" y="-5"
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="auto">
+      reference
+    </text>
+  </g>
+
+  <g transform="translate(-160, 300)">
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l -70 0" />
+    <text x="-20" y="-5"
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="auto">
+      full
+    </text>
+  </g>
+
+  <g transform="translate(-80, 340)"> <!-- edge labelled "part": down, then left -->
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l 0 40 l -30 0" />
+    <text x="5" y="20"
+      font-size="12" fill="black"
+      text-anchor="start" dominant-baseline="auto">
+      part
+    </text>
+  </g>
+
+  <g transform="translate(40, 240)"> <!-- downward edge labelled "temporary" -->
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l 0 110" />
+    <text x="5" y="55"
+      font-size="12" fill="black"
+      text-anchor="start" dominant-baseline="auto">
+      temporary
+    </text>
+  </g>
+</svg>
diff --git a/src/corelib/doc/images/string_class_calling.svg b/src/corelib/doc/images/string_class_calling.svg
new file mode 100644
index 00000000000..2fcc15bea3d
--- /dev/null
+++ b/src/corelib/doc/images/string_class_calling.svg
@@ -0,0 +1,266 @@
+<?xml version="1.0" encoding="UTF-8" standalone="no"?>
+<svg
+  viewBox="-410 -30 540 540"
+  version="1.1"
+  xmlns="http://www.w3.org/2000/svg"
+  xmlns:svg="http://www.w3.org/2000/svg">
+  <defs>
+    <path id="raute"
+      fill="#cfe7f5"
+      stroke="black"
+      stroke-width="1px"
+      d="m 0 -40 L 80 0 L 0 40 L -80 0 z" />
+    <path id="lozenge"
+      fill="#cfe7f5"
+      stroke="black"
+      stroke-width="1px"
+      d="M -60,-20
+         h 120
+         a 20,20 0 0 1 20,20
+         v 0
+         a 20,20 0 0 1 -20,20
+         h -120
+         a 20,20 0 0 1 -20,-20
+         v 0
+         a 20,20 0 0 1 20,-20
+         Z"/>
+    <path id="lozenge_small"
+      fill="#cfe7f5"
+      stroke="black"
+      stroke-width="1px"
+      d="M -40,-20
+         h 80
+         a 20,20 0 0 1 20,20
+         v 0
+         a 20,20 0 0 1 -20,20
+         h -80
+         a 20,20 0 0 1 -20,-20
+         v 0
+         a 20,20 0 0 1 20,-20
+         Z"/>
+    <marker
+      id="triangle"
+      viewBox="0 0 10 10"
+      refX="1"
+      refY="5"
+      markerUnits="strokeWidth"
+      markerWidth="10"
+      markerHeight="10"
+      orient="auto">
+      <path d="M 0 0 L 10 5 L 0 10 z" fill="black" />
+    </marker>
+  </defs>
+
+  <g id="start" transform="translate(-160, 0)">
+    <use href="#lozenge_small" />
+    <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle"
+      transform="translate(0, -6)">
+      <tspan x="0" dy="0em">String class for</tspan>
+      <tspan x="0" dy="1.2em">calling Qt functions</tspan>
+    </text>
+  </g>
+
+  <g id="param_or_return" transform="translate(-160, 100)">
+   <use href="#raute" />
+   <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle"
+      transform="translate(0, -12)">
+      <tspan x="0" dy="0em">Is your string</tspan>
+      <tspan x="0" dy="1.2em">known at compile time</tspan>
+      <tspan x="0" dy="1.2em">(a literal)?</tspan>
+  </text>
+  </g>
+
+  <g id="ref_or_perm" transform="translate(-320, 200)">
+    <use href="#raute" />
+     <text
+       font-size="12" fill="black"
+       text-anchor="middle" dominant-baseline="middle"
+       transform="translate(0, -6)">
+       <tspan x="0" dy="0em">Is the parameter a</tspan>
+       <tspan x="0" dy="1.2em">QString or a *View?</tspan>
+  </text>
+  </g>
+
+
+  <g id="know_encoding" transform="translate(-320, 330)"> <!-- decision node; id renamed so it is unique in this document -->
+    <use href="#raute" />
+    <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle"
+      transform="translate(0, -6)">
+      <tspan x="0" dy="0em">Do you know the</tspan>
+      <tspan x="0" dy="1.2em">preferred encoding?</tspan>
+    </text>
+  </g>
+
+
+  <g id="make_copy" transform="translate(-100, 330)">
+    <use href="#raute" />
+    <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle"
+      transform="translate(0, -6)">
+      <tspan x="0" dy="0em">Is your string</tspan>
+      <tspan x="0" dy="1.2em">ASCII?</tspan>
+    </text>
+  </g>
+
+  <g transform="translate(40, 150)">
+    <use href="#lozenge" />
+    <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle"
+      transform="translate(0, -4)" >
+      <tspan x="0" dy="0em">QString</tspan>
+      <tspan font-size="8" x="0" dy="1.4em">or what is already existing</tspan>
+    </text>
+  </g>
+
+  <g transform="translate(-100, 200)">
+    <use href="#lozenge" />
+    <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle"
+      transform="translate(0, -4)" >
+      <tspan x="0" dy="0em">QStringLiteral</tspan>
+      <tspan font-size="8" x="0" dy="1.4em">same as u""_s</tspan>
+    </text>
+  </g>
+
+  <g transform="translate(40, 390)"> <!-- result node: QLatin1StringView -->
+    <use href="#lozenge" />
+    <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle"
+      transform="translate(0, -4)" >
+      <tspan x="0" dy="0em">QLatin1StringView</tspan>
+      <tspan font-size="8" x="0" dy="1.4em">create with ""_L1</tspan>
+    </text>
+  </g>
+
+  <g transform="translate(-100, 430)"> <!-- result node: QStringView -->
+    <use href="#lozenge" />
+    <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle"
+      transform="translate(0, -4)" >
+      <tspan x="0" dy="0em">QStringView</tspan>
+      <tspan font-size="8" x="0" dy="1.4em">create with u""</tspan>
+    </text>
+  </g>
+
+
+  <g transform="translate(-320, 430)">
+    <use href="#lozenge" />
+    <text
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="middle"
+      transform="translate(0, -8)" >
+      <tspan x="0" dy="0em">Q*StringView</tspan>
+      <tspan font-size="8" x="0" dy="1.4em">of the preferred encoding,</tspan>
+      <tspan font-size="8" x="0" dy="1.2em">create with u"", u8"" or ""_L1</tspan>
+    </text>
+  </g>
+
+  <g transform="translate(-160, 20)">
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l 0 30" />
+  </g>
+
+  <g transform="translate(-240, 100)">
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l -80 0 l 0 50" />
+    <text x="-40" y="-5"
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="auto">
+      yes
+    </text>
+  </g>
+
+  <g transform="translate(-80, 100)">
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l 120 0 l 0 20" />
+    <text x="60" y="-5"
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="auto">
+      no
+    </text>
+  </g>
+
+
+  <g transform="translate(-240, 200)">
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l 50 0 " />
+    <text x="25" y="-5"
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="auto">
+      QString
+    </text>
+  </g>
+
+
+  <g transform="translate(-320, 240)"> <!-- downward edge labelled "*View" -->
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l 0 40 " />
+    <text x="5" y="20"
+      font-size="12" fill="black"
+      text-anchor="start" dominant-baseline="middle">
+      *View
+    </text>
+  </g>
+
+  <g transform="translate(-240, 330)">
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l 50 0" />
+    <text x="30" y="-5"
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="auto">
+      no
+    </text>
+  </g>
+
+  <g transform="translate(-320, 370)"> <!-- downward edge labelled "yes" -->
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l 0 30" />
+    <text x="5" y="15"
+      font-size="12" fill="black"
+      text-anchor="start" dominant-baseline="middle">
+      yes
+    </text>
+  </g>
+
+
+  <g transform="translate(-20, 330)">
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l 60 0 l 0 30" />
+    <text x="30" y="-5"
+      font-size="12" fill="black"
+      text-anchor="middle" dominant-baseline="auto">
+      yes
+    </text>
+  </g>
+
+  <g transform="translate(-100, 370)"> <!-- downward edge labelled "no" -->
+    <path
+      fill="none" stroke="black" marker-end="url(#triangle)"
+      d="M 0 0 l 0 30" />
+    <text x="5" y="15"
+      font-size="12" fill="black"
+      text-anchor="start" dominant-baseline="middle">
+      no
+    </text>
+  </g>
+
+</svg>
diff --git a/src/corelib/doc/src/qstring-overview.qdoc b/src/corelib/doc/src/qstring-overview.qdoc
new file mode 100644
index 00000000000..7d52b80aec7
--- /dev/null
+++ b/src/corelib/doc/src/qstring-overview.qdoc
@@ -0,0 +1,410 @@
+// Copyright (C) 2025 The Qt Company Ltd.
+// SPDX-License-Identifier: LicenseRef-Qt-Commercial OR GFDL-1.3-no-invariants-only
+
+/*!
+    \group string-processing
+
+    \title Classes for string data
+
+    \section1 Overview
+
+    This page gives an overview of the string classes in Qt, in particular the
+    large number of string containers and how to use them efficiently in
+    performance-critical code.
+
+    The following instructions for efficient use are aimed at experienced
+    developers working on performance-critical code that contains considerable
+    amounts of string processing. This is, for example, a parser or a text file
+    generator. \e {Generally, \l QString can be used everywhere and it will
+    perform fine.} It also provides APIs for handling several encodings (for
+    example \l{QString::fromLatin1}). For many applications and especially when
+    string-processing plays an insignificant role for performance, \l QString
+    will be a simple and sufficient solution. Some Qt functions return a \l
+    QStringView. It can be converted to a QString with
+    \l{QStringView::}{toString()} if required.
+
+    \section2 Impactful tips
+
+    The following three rules improve string handling substantially without
+    increasing the complexity too much. Follow these rules to get nearly
+    optimal performance in most cases. The first two rules address encoding of
+    string literals and marking them in source code. The third rule addresses
+    deep copies when using parts of a string.
+
+    \list
+
+    \li All strings that only contain ASCII characters (for example log
+    messages) can be encoded with Latin-1. Use the
+    \l{StringLiterals::operator""_L1}{string literal} \c{"foo"_L1}. Without
+    this suffix, string literals in source code are assumed to be UTF-8
+    encoded and processing them will be slower. Generally, try to use the
+    tightest encoding, which is Latin-1 in many cases.
+
+    \li User-visible strings are usually translated and thus passed through the
+    \l {QObject::tr} function. This function takes a string literal (const char
+    array) and returns a \l QString with UTF-16 encoding as demanded by all UI
+    elements. If the translation infrastructure is not used, you should use
+    UTF-16 encoding throughout the whole application. Use the string literal
+    \c{u"foo"} to create UTF-16 string literals or the Qt specific literal
+    \c{u"foo"_s} to directly create a \l QString.
+
+    \li When processing parts of a \l QString, instead of copying each part
+    into its own \l QString object, create \l QStringView objects instead.
+    These can be converted back to \l QString using
+    \l{QStringView::toString()}, but avoid doing so as much as possible. If
+    functions return \l QStringView, it is most efficient to keep working with
+    this class, if possible. The API is similar to a constant \l QString.
+
+    \endlist
+
+    \section2 Efficient usage
+
+    To use string classes efficiently, one should understand the three concepts
+    of:
+    \list
+      \li Encoding
+      \li Owning and non-owning containers
+      \li Literals
+    \endlist
+
+    \section3 Encoding
+
+    Encoding-wise Qt supports UTF-16, UTF-8, Latin-1 (ISO 8859-1) and US-ASCII
+    (that is the common subset of Latin-1 and UTF-8) in one form or another.
+    \list
+      \li Latin-1 is a character encoding that uses a single byte per character
+          which makes it the most efficient but also limited encoding.
+      \li UTF-8 is a variable-length character encoding that encodes all
+          characters using one to four bytes. It is backwards compatible with
+          US-ASCII and it is the common encoding for source code and similar
+          files.
+      \li UTF-16 is a variable-length encoding that uses two or four bytes per
+          character. It is the common encoding for user-exposed text in Qt.
+    \endlist
+    See the \l{Unicode in Qt}{information about support for Unicode in Qt} for
+    more information.
+
+    Other encodings are supported in the form of single functions like
+    \l{QString::fromUcs4} or of the \l{QStringConverter} classes. Furthermore,
+    Qt provides an encoding-agnostic container for data, \l QByteArray, that is
+    well-suited to storing binary data. \l QAnyStringView keeps track of the
+    encoding of the underlying string and can thus carry a view onto strings
+    with any of the supported encoding standards.
+
+    Converting between encodings is expensive; therefore, avoid it if possible. On
+    the other hand, a more compact encoding, particularly for string literals,
+    can reduce binary size, which can increase performance. Where string
+    literals can be expressed in Latin-1, it manages a good compromise between
+    these competing factors, even if it has to be converted to UTF-16 at some
+    point. When a Latin-1 string must be converted to a \l QString, it is done
+    relatively efficiently.
+
+    \section3 Functionality
+
+    String classes can be further distinguished by the functionality they
+    support. One major distinction is whether they own, and thus control, their
+    data or merely reference data held elsewhere. The former are called \e
+    owning containers, the latter \e non-owning containers or views. A
+    non-owning container type typically just records a pointer to the start of
+    the data and its size, making it lightweight and cheap, but it only remains
+    valid as long as the data remains available. An owning string manages the
+    memory in which it stores its data, ensuring that data remains available
+    throughout the lifetime of the container, but its creation and destruction
+    incur the costs of allocating and releasing memory. Views typically support
+    a subset of the functions of the owning string, lacking the possibility to
+    modify the underlying data.
+
+    As a result, string views are particularly well-suited to representing
+    parts of larger strings, for example in a parser, while owning strings are
+    good for persistent storage, such as members of a class. Where a function
+    returns a string that it has constructed, for example by combining
+    fragments, it has to return an owning string; but where a function returns
+    part of some persistently stored string, a view is usually more suitable.
+
+    Note that owning containers in Qt share their data \l{Implicit
+    Sharing}{implicitly}, meaning that it is also efficient to pass or return
+    large containers by value, although slightly less efficient than passing by
+    reference due to the reference counting. If you want to make use of the
+    implicit data sharing mechanism of Qt classes, you have to pass the string
+    as an owning container or a reference to one. Conversion to a view and back
+    will always create an additional copy of the data.
+
+    Finally, Qt provides classes for single characters, lists of strings and
+    string matchers. These classes are available for most supported encoding
+    standards in Qt, with some exceptions. Higher level functionality is
+    provided by specialized classes, such as \l QLocale or \l
+    QTextBoundaryFinder. These high level classes usually rely on \l QString
+    and its UTF-16 encoding. Some classes are templates and work with all
+    available string classes.
+
+    \section3 Literals
+
+    The C++ standard provides
+    \l{https://en.cppreference.com/w/cpp/language/string_literal} {string
+    literals} to create strings at compile-time. There are string literals
+    defined by the language and literals defined by Qt, so-called
+    \l{https://en.cppreference.com/w/cpp/language/user_literal}{user-defined
+    literals}. A string literal defined by C++ is enclosed in double quotes and
+    can have a prefix that tells the compiler how to interpret its content. For
+    Qt, the UTF-16 string literal \c{u"foo"} is the most important. It creates
+    a string encoded in UTF-16 at compile-time, saving the need to convert from
+    some other encoding at run-time. \l QStringView can be easily and
+    efficiently constructed from one, so they can be passed to functions that
+    accept a \l QStringView argument (or, as a result, a \l QAnyStringView).
+
+    User-defined literals have the same form as those defined by C++ but add a
+    suffix after the closing quote. The encoding remains determined by the
+    prefix, but the resulting literal is used to construct an object of some
+    user-defined type. Qt thus defines these for some of its own string types:
+    \c{u"foo"_s} for \c QString, \c{"foo"_L1} for \c QLatin1StringView and
+    \c{"foo"_ba} for \c QByteArray. These are provided by using the
+    \l{StringLiterals Namespace}. A plain C++ string literal \c{"foo"} will be
+    understood as UTF-8 and conversion to QString and thus UTF-16 will be
+    expensive. When you have string literals in plain ASCII, use \c{"foo"_L1}
+    to interpret it as Latin-1, gaining the various benefits outlined above.
+
+    \section1 Basic string classes
+
+    The following table gives an overview of the basic string classes for the
+    various standards of text encoding.
+
+    \table
+    \header
+        \li Encoding
+        \li C++ String literal
+        \li Qt user-defined literal
+        \li C++ Character
+        \li Qt Character
+        \li Owning string
+        \li Non-owning string
+    \row
+        \li Latin-1
+        \li -
+        \li ""_L1
+        \li -
+        \li \l QLatin1Char
+        \li -
+        \li \l QLatin1StringView
+    \row
+        \li UTF-8
+        \li u8""
+        \li -
+        \li char8_t
+        \li -
+        \li -
+        \li \l QUtf8StringView
+    \row
+        \li UTF-16
+        \li u""
+        \li u""_s
+        \li char16_t
+        \li \l QChar
+        \li \l QString
+        \li \l QStringView
+    \row
+        \li Binary/None
+        \li ""
+        \li ""_ba
+        \li std::byte
+        \li -
+        \li \l QByteArray
+        \li \l QByteArrayView
+    \row
+        \li Flexible
+        \li any
+        \li -
+        \li -
+        \li -
+        \li -
+        \li \l QAnyStringView
+    \endtable
+
+    Some of the missing entries can be substituted with built-in and standard
+    library C++ types: An owning Latin-1 or UTF-8 encoded string can be
+    \c{std::string} or any 8-bit \c char array. \l QStringView can also reference
+    any 16-bit character arrays, such as std::u16string or std::wstring on some
+    platforms.
+
+    Qt also provides specialized lists for some of those types, namely \l
+    QStringList and \l QByteArrayList, as well as matchers, \l
+    QLatin1StringMatcher and \l QByteArrayMatcher. The matchers also have
+    static versions that are created at compile-time, \l
+    QStaticLatin1StringMatcher and \l QStaticByteArrayMatcher.
+
+    Further worth noting:
+
+    \list
+
+    \li \l QStringLiteral is a macro which is identical to \c{u"foo"_s} and
+    available without the \l{StringLiterals Namespace}. Preferably you should
+    use the modern string literal.
+
+    \li \l QLatin1String is a synonym for \l QLatin1StringView and exists for
+    backwards compatibility. It is not an owning string and might be removed in
+    future releases.
+
+    \li \l QAnyStringView provides a view for a string with any of the three
+    supported encodings. The encoding is stored alongside the reference to the
+    data. This class is well suited to create interfaces that take a wide
+    spectrum of string types and encodings. In contrast to other classes, no
+    processing is conducted on \l QAnyStringView directly. Processing is
+    conducted on the underlying \l QLatin1StringView, \l QUtf8StringView or
+    \l QStringView in the respective encoding. Use \l QAnyStringView::visit()
+    to do the same in your own functions that take this class as an argument.
+
+    \li A \l QLatin1StringView with non-ASCII characters is not straightforward
+    to construct in a UTF-8 encoded source code file and requires special
+    treatment, see the \l QLatin1StringView documentation.
+
+    \li \l QStringRef is a reference to a portion of a \l QString, available in
+    the Qt5Compat module for backwards compatibility. It should be replaced by
+    \l QStringView.
+
+    \endlist
+
+    \section1 High-level string-related classes
+
+    More high-level classes that provide additional functionality work
+    mostly with \l QString and thus UTF-16. These are:
+
+    \list
+        \li \l QRegularExpression, \l QRegularExpressionMatch and
+            \l QRegularExpressionMatchIterator to work with pattern matching
+            and regular expressions.
+        \li \l QLocale to convert numbers and data to string with respect to
+            the user's language and country.
+        \li \l QCollator and \l QCollatorSortKey to compare strings with
+            respect to the user's language, script or territory.
+        \li \l QTextBoundaryFinder to break up text ready for typesetting
+            in accord with Unicode rules.
+        \li \c{QStringBuilder}, an internal class that will substantially
+            improve the performance of string concatenations with the \c{+}
+            operator, see the \l QString documentation.
+    \endlist
+
+    Some classes are templates or have a flexible API and work with various
+    string classes. These are
+
+    \list
+      \li \l QTextStream to stream into \l QIODevice, \l QByteArray or
+          \l QString
+      \li \l QStringTokenizer to split strings
+    \endlist
+
+    \section1 Which string class to use?
+
+    The general guidance in using string classes is:
+    \list
+      \li Avoid copying and memory allocations,
+      \li Avoid encoding conversions, and
+      \li Choose the most compact encoding.
+    \endlist
+
+    Qt provides many functionalities to avoid memory allocations. Most Qt
+    containers employ \l{Implicit Sharing} of their data. For implicit sharing
+    to work, there must be an uninterrupted chain of the same class —
+    converting from \l QString to \l QStringView and back will result in two \l
+    {QString}{QStrings} that do not share their data. Therefore, functions need
+    to pass their data as \l QString (both values or references work).
+    Extracting parts of a string is not possible with implicit data sharing. To
+    use parts of a longer string, make use of string views, an explicit form of
+    data sharing.
+
+    Conversions between encodings can be reduced by sticking to a certain
+    encoding. Data received, for example in UTF-8, is best stored and processed
+    in UTF-8 if no conversion to any other encoding is required. Comparisons
+    between strings of the same encoding are fastest and the same is the case
+    for most other operations. If strings of a certain encoding are often
+    compared or converted to any other encoding it might be beneficial to
+    convert and store them once. Some operations provide many overloads (or a
+    \l QAnyStringView overload) to take various string types and encodings and
+    they should be the second choice to optimize performance, if using the same
+    encoding is not feasible. Explicit encoding conversions before calling a
+    function should be a last resort when no other option is available. Latin-1
+    is a very simple encoding and operations between Latin-1 and any other
+    encoding are almost as efficient as operations between the same encoding.
+
+    The most efficient encoding (from most to least efficient: Latin-1, UTF-8,
+    UTF-16) should be chosen when no other constraints determine the encoding.
+    For error handling and logging \l QLatin1StringView is usually sufficient.
+    User-visible strings in Qt are always of type \l {QString} and as such
+    UTF-16 encoded. Therefore it is most effective to use \l
+    {QString}{QStrings}, \l {QStringView}{QStringViews} and \l
+    {QStringLiteral}{QStringLiterals} throughout the life-time of a
+    user-visible string. The \l QObject::tr function provides the correct
+    encoding and type. \l QByteArray should be used if encoding does not play a
+    role, for example to store binary data, or if the encoding is unknown.
+
+    \section2 String class for creating API
+
+    \image string_class_api.svg "String class for an optimal API"
+
+    \section3 Member variables
+
+    Member variables should be of an owning type in nearly all cases. Views can only
+    be used as member variables if the lifetime of the referenced owning string
+    is guaranteed to exceed the lifetime of the object.
+
+    \section3 Function arguments
+
+    Function arguments should be string views of a suitable encoding in most
+    cases. \l QAnyStringView can be used as a parameter to support more than
+    one encoding and \l QAnyStringView::visit can be used internally to fork
+    off into per-encoding functions. If the function is limited to a single
+    encoding, \l QLatin1StringView, \l QUtf8StringView, \l QStringView or \l
+    QByteArrayView should be used.
+
+    If the function saves the argument in an owning string (usually a
+    setter function), it is most efficient to use the same owning string as
+    function argument to make use of the implicit data sharing functionality of
+    Qt. The owning string can be passed as a \c const reference. Overloading
+    functions with multiple owning and non-owning string types can lead to
+    overload ambiguity and should be avoided. Owning string types in Qt can be
+    automatically converted to their non-owning version or to \l
+    QAnyStringView.
+
+    \section3 Return values
+
+    Temporary strings have to be returned as an owning string, usually
+    \l QString. If the returned string is known at compile-time use
+    \c{u"foo"_s} to construct the \l QString structure at compile-time. If
+    existing owning strings (for example \l QString) are returned from a
+    function in full (for example a getter function), it is most efficient to
+    return them by reference. They can also be returned by value to allow
+    returning a temporary in the future. Qt's use of implicit sharing avoids
+    the performance impact of allocation and copying when returning by value.
+
+    Parts of existing strings can be returned efficiently with a string view
+    of the appropriate encoding; for an example, see \l
+    QRegularExpressionMatch::capturedView which returns a \l QStringView.
+
+    \section2 String class for using API
+
+    \image string_class_calling.svg "String class for calling a function"
+
+    To use a Qt API efficiently you should try to match the function argument
+    types. If you are limited in your choice, Qt will conduct various
+    conversions: Owning strings are implicitly converted to non-owning
+    strings, non-owning strings can create their owning counterparts,
+    see for example \l QStringView::toString. Encoding conversions are
+    conducted implicitly in many cases but this should be avoided if possible.
+    To avoid accidental implicit conversion from UTF-8 you can activate the
+    macro \l QT_NO_CAST_FROM_ASCII.
+
+    If you need to assemble a string at runtime before passing it to a function
+    you will need an owning string and thus \l QString. If the function
+    argument is \l QStringView or \l QAnyStringView it will be implicitly
+    converted.
+
+    If the string is known at compile-time, there is room for optimization. If
+    the function accepts a \l QString, you should create it with \c{u"foo"_s}
+    or the \l QStringLiteral macro. If the function expects a \l QStringView,
+    it is best constructed with an ordinary UTF-16 string literal \c{u"foo"},
+    if a \l QLatin1StringView is expected, construct it with \c{"foo"_L1}. If
+    you have the choice between both, for example if the function expects \l
+    QAnyStringView, use the tightest encoding, usually Latin-1.
+
+    \section1 List of all string related classes
+*/
+
+// The list is autogenerated by qdoc because this is a group page
diff --git a/src/corelib/doc/src/qtcore-toc.qdoc b/src/corelib/doc/src/qtcore-toc.qdoc
index e3aad63b358..bdaa471413b 100644
--- a/src/corelib/doc/src/qtcore-toc.qdoc
+++ b/src/corelib/doc/src/qtcore-toc.qdoc
@@ -19,7 +19,8 @@
         \list
             \li \l {Event Classes}
         \endlist
-    \li \l{Implicit Sharing}
+    \li \l {Classes for string data}
+    \li \l {Implicit Sharing}
         \list
             \li \l {Implicitly Shared Classes}
         \endlist