From nobody Mon Feb  9 05:04:36 2026
Received: from smtp.kernel.org (aws-us-west-2-korg-mail-1.web.codeaurora.org
 [10.30.226.201])
	(using TLSv1.2 with cipher ECDHE-RSA-AES256-GCM-SHA384 (256/256 bits))
	(No client certificate requested)
	by smtp.subspace.kernel.org (Postfix) with ESMTPS id 0D39F101F2;
	Tue, 28 Jan 2025 00:06:37 +0000 (UTC)
Authentication-Results: smtp.subspace.kernel.org;
 arc=none smtp.client-ip=10.30.226.201
ARC-Seal: i=1; a=rsa-sha256; d=subspace.kernel.org; s=arc-20240116;
	t=1738022797; cv=none;
 b=F15FFFJxhTMK9TW2SHYIFjDeO8L+SZaXtpOGvJcRI05WTYXH2Secoy8bGAzTFgk1/xXl2cbMkGdEHF5e9SRBCPLZ/nQSt33dvE91JtueScwXGKjkvdc+c7KUOCaZ0RbmDgGO+vfEvWY8jMM767eu6lH86YxHIbDNQ2Txs1FIaV8=
ARC-Message-Signature: i=1; a=rsa-sha256; d=subspace.kernel.org;
	s=arc-20240116; t=1738022797; c=relaxed/simple;
	bh=Ig/wrssKDOB8y1m2J/EooG9A8FvmBFRH9/TycqOd21E=;
	h=From:To:Cc:Subject:Date:Message-ID:In-Reply-To:References:
	 MIME-Version;
 b=MsYiH5QrMVOON3qiGKO/E1CQ8FVdROzATsQridnnrcG3GVTEOCD2oW2vvDRbEpC7XEwg2jgohxiPVDX1AY070unuPr6t5zQYIJXmQhNjtDNIXnKDSd2NhgZZUW1HeQWu2maoAewyjQDnMJWaEMQv2ZNJiPeLBvcRqt5dsovQJcM=
ARC-Authentication-Results: i=1; smtp.subspace.kernel.org;
 dkim=pass (2048-bit key) header.d=kernel.org header.i=@kernel.org
 header.b=SVC2MNhR; arc=none smtp.client-ip=10.30.226.201
Authentication-Results: smtp.subspace.kernel.org;
	dkim=pass (2048-bit key) header.d=kernel.org header.i=@kernel.org
 header.b="SVC2MNhR"
Received: by smtp.kernel.org (Postfix) with ESMTPSA id DBBE3C4CEF7;
	Tue, 28 Jan 2025 00:06:35 +0000 (UTC)
DKIM-Signature: v=1; a=rsa-sha256; c=relaxed/simple; d=kernel.org;
	s=k20201202; t=1738022796;
	bh=Ig/wrssKDOB8y1m2J/EooG9A8FvmBFRH9/TycqOd21E=;
	h=From:To:Cc:Subject:Date:In-Reply-To:References:From;
	b=SVC2MNhRvYZRnrULbrk14qiuRYZr+EbHxmhLiw/LKs5FIfJTPakgjzvELglMjFUin
	 hEu/iWJ5DmdFpzLvbdQTQAnwCTYpmcV/Uyc+G1WUfiseqO1ml9tYDw6LKbwTlr482b
	 gFxiNeVJnoVozjE5ii3jjfYi7qwC+GBDrwkUy1yfM5o4Upp72yeN6ZmIpQ2iYlmDIO
	 ggGTZoTsNGtMkNHQCfhhWzYfRKdpqMTtazjGDbHFiHuXUqWz6BOy6NBUX6+iz12YAu
	 5fEGVObZ+qLX7fW/JZ1Nt3SUdcm85cDK9OOtAEAdOpQ8vLntyBsFqZD1QWdRjrXT/l
	 bQN1wXQV9caAw==
Received: from mchehab by mail.kernel.org with local (Exim 4.98)
	(envelope-from <mchehab+huawei@kernel.org>)
	id 1tcZ7i-0000000DRLb-0LCE;
	Tue, 28 Jan 2025 01:06:34 +0100
From: Mauro Carvalho Chehab <mchehab+huawei@kernel.org>
To: Linux Doc Mailing List <linux-doc@vger.kernel.org>,
	Jonathan Corbet <corbet@lwn.net>,
	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Cc: Mauro Carvalho Chehab <mchehab+huawei@kernel.org>,
	"Mauro Carvalho Chehab" <mchehab+huawei@kernel.org>,
	linux-kernel@vger.kernel.org
Subject: [RFC v2 19/38] docs: sphinx/kernel_abi: reduce buffer usage for ABI
 messages
Date: Tue, 28 Jan 2025 01:06:08 +0100
Message-ID: 
 <a883f72c90a51b0355ab220caba9a6f481caf6a3.1738020236.git.mchehab+huawei@kernel.org>
X-Mailer: git-send-email 2.48.1
In-Reply-To: <cover.1738020236.git.mchehab+huawei@kernel.org>
References: <cover.1738020236.git.mchehab+huawei@kernel.org>
Precedence: bulk
X-Mailing-List: linux-kernel@vger.kernel.org
List-Id: <linux-kernel.vger.kernel.org>
List-Subscribe: <mailto:linux-kernel+subscribe@vger.kernel.org>
List-Unsubscribe: <mailto:linux-kernel+unsubscribe@vger.kernel.org>
MIME-Version: 1.0
Content-Transfer-Encoding: quoted-printable
Sender: Mauro Carvalho Chehab <mchehab+huawei@kernel.org>
Content-Type: text/plain; charset="utf-8"

Instead of producing a big message with all ABI contents and then
parse as a whole, simplify the code by handling each ABI symbol
in separate. As an additional benefit, there's no need to place
file/line nubers inlined at the data and use a regex to convert
them.

Signed-off-by: Mauro Carvalho Chehab <mchehab+huawei@kernel.org>
---
 Documentation/sphinx/kernel_abi.py | 76 +++++++++++++++---------------
 scripts/get_abi.py                 | 17 +++----
 2 files changed, 48 insertions(+), 45 deletions(-)

diff --git a/Documentation/sphinx/kernel_abi.py b/Documentation/sphinx/kern=
el_abi.py
index 93d537d8cb6c..025a4f02e1a4 100644
--- a/Documentation/sphinx/kernel_abi.py
+++ b/Documentation/sphinx/kernel_abi.py
@@ -68,6 +68,7 @@ class KernelCmd(Directive):
     has_content =3D False
     final_argument_whitespace =3D True
     logger =3D logging.getLogger('kernel_abi')
+    parser =3D None
=20
     option_spec =3D {
         "debug": directives.flag,
@@ -79,59 +80,60 @@ class KernelCmd(Directive):
             raise self.warning("docutils: file insertion disabled")
=20
         path =3D os.path.join(srctree, "Documentation", self.arguments[0])
-        parser =3D AbiParser(path, logger=3Dself.logger)
-        parser.parse_abi()
-        parser.check_issues()
+        self.parser =3D AbiParser(path, logger=3Dself.logger)
+        self.parser.parse_abi()
+        self.parser.check_issues()
=20
-        msg =3D ""
-        for m in parser.doc(enable_lineno=3DTrue, show_file=3DTrue):
-            msg +=3D m
-
-        node =3D self.nested_parse(msg, self.arguments[0])
+        node =3D self.nested_parse(None, self.arguments[0])
         return node
=20
-    def nested_parse(self, lines, fname):
+    def nested_parse(self, data, fname):
         env =3D self.state.document.settings.env
         content =3D ViewList()
         node =3D nodes.section()
=20
-        if "debug" in self.options:
-            code_block =3D "\n\n.. code-block:: rst\n    :linenos:\n"
-            for line in lines.split("\n"):
-                code_block +=3D "\n    " + line
-            lines =3D code_block + "\n\n"
+        if data is not None:
+            # Handles the .rst file
+            for line in data.split("\n"):
+                content.append(line, fname, 0)
=20
-        line_regex =3D re.compile(r"^\.\. LINENO (\S+)\#([0-9]+)$")
-        ln =3D 0
-        n =3D 0
-        f =3D fname
+            self.do_parse(content, node)
=20
-        for line in lines.split("\n"):
-            n =3D n + 1
-            match =3D line_regex.search(line)
-            if match:
-                new_f =3D match.group(1)
+        else:
+            # Handles the ABI parser content, symbol by symbol
=20
-                # Sphinx parser is lazy: it stops parsing contents in the
-                # middle, if it is too big. So, handle it per input file
-                if new_f !=3D f and content:
-                    self.do_parse(content, node)
-                    content =3D ViewList()
+            old_f =3D fname
+            n =3D 0
+            for msg, f, ln in self.parser.doc():
+                msg_list =3D msg.split("\n")
+                if "debug" in self.options:
+                    lines =3D [
+                        "", "",  ".. code-block:: rst",
+                        "    :linenos:", ""
+                    ]
+                    for m in msg_list:
+                        lines.append("    " + m)
+                else:
+                    lines =3D msg_list
=20
+                for line in lines:
+                    # sphinx counts lines from 0
+                    content.append(line, f, ln - 1)
+                    n +=3D 1
+
+                if f !=3D old_f:
                     # Add the file to Sphinx build dependencies
                     env.note_dependency(os.path.abspath(f))
=20
-                f =3D new_f
+                    old_f =3D f
=20
-                # sphinx counts lines from 0
-                ln =3D int(match.group(2)) - 1
-            else:
-                content.append(line, f, ln)
+                # Sphinx doesn't like to parse big messages. So, let's
+                # add content symbol by symbol
+                if content:
+                    self.do_parse(content, node)
+                    content =3D ViewList()
=20
-        self.logger.info("%s: parsed %i lines" % (fname, n))
-
-        if content:
-            self.do_parse(content, node)
+            self.logger.info("%s: parsed %i lines" % (fname, n))
=20
         return node.children
=20
diff --git a/scripts/get_abi.py b/scripts/get_abi.py
index 3a8dcff85dc2..b57f46b91828 100755
--- a/scripts/get_abi.py
+++ b/scripts/get_abi.py
@@ -441,7 +441,7 @@ class AbiParser:
=20
         return new_desc + "\n\n"
=20
-    def doc(self, enable_lineno=3DFalse, output_in_txt=3DFalse, show_file=
=3DFalse):
+    def doc(self, output_in_txt=3DFalse, show_file=3DTrue):
         """Print ABI at stdout"""
=20
         part =3D None
@@ -458,10 +458,6 @@ class AbiParser:
=20
             msg =3D ""
=20
-            if enable_lineno:
-                ln =3D v.get("line_no", 1)
-                msg +=3D f".. LINENO {file_ref[0][0]}#{ln}\n\n"
-
             if wtype !=3D "File":
                 cur_part =3D names[0]
                 if cur_part.find("/") >=3D 0:
@@ -522,7 +518,9 @@ class AbiParser:
             if users and users.strip(" \t\n"):
                 msg +=3D f"Users:\n\t{users.strip("\n").replace('\n', '\n\=
t')}\n\n"
=20
-            yield msg
+            ln =3D v.get("line_no", 1)
+
+            yield (msg, file_ref[0][0], ln)
=20
     def check_issues(self):
         """Warn about duplicated ABI entries"""
@@ -630,8 +628,11 @@ class AbiRest:
         parser.parse_abi()
         parser.check_issues()
=20
-        for msg in parser.doc(args.enable_lineno, args.raw, not args.no_fi=
le):
-            print(msg)
+        for t in parser.doc(args.raw, not args.no_file):
+            if args.enable_lineno:
+                print (f".. LINENO {t[1]}#{t[2]}\n\n")
+
+            print(t[0])
=20
=20
 class AbiValidate:
--=20
2.48.1