scripts: Some minor regex cleanup

Just trying to make regex in scripts a bit more consistent. Though regex being regex this may be fruitless.
2025-12-01 12:20:02 +00:00 · 2024-12-04 01:02:50 -06:00
parent 28d89eb009
commit b90b2953ea
6 changed files with 42 additions and 44 deletions
--- a/scripts/perfbd.py
+++ b/scripts/perfbd.py
@ -352,22 +352,21 @@ def collect_dwarf_lines(obj_path, *,
        objdump_path=OBJDUMP_PATH,
        **args):
    line_pattern = re.compile(
-            '^\s*(?:'
-                # matches dir/file table
-                '(?P<no>[0-9]+)'
+            # matches dir/file table
+            '^\s*(?P<no>[0-9]+)'
                    '(?:\s+(?P<dir>[0-9]+))?'
-                    '.*\s+(?P<path>[^\s]+)'
+                    '.*\s+(?P<path>[^\s]+)\s*$'
                # matches line opcodes
-                '|' '\[[^\]]*\]\s+' '(?:'
-                    '(?P<op_special>Special)'
-                    '|' '(?P<op_copy>Copy)'
-                    '|' '(?P<op_end>End of Sequence)'
-                    '|' 'File .*?to (?:entry )?(?P<op_file>\d+)'
-                    '|' 'Line .*?to (?P<op_line>[0-9]+)'
-                    '|' '(?:Address|PC) .*?to (?P<op_addr>[0x0-9a-fA-F]+)'
-                    '|' '.'
-                ')*'
-            ')\s*$', re.IGNORECASE)
+                '|' '^\s*\[[^\]]*\]' '(?:'
+                    '\s+(?P<op_special>Special)'
+                        '|' '\s+(?P<op_copy>Copy)'
+                        '|' '\s+(?P<op_end>End of Sequence)'
+                        '|' '\s+File.*?to.*?(?P<op_file>[0-9]+)'
+                        '|' '\s+Line.*?to.*?(?P<op_line>[0-9]+)'
+                        '|' '\s+(?:Address|PC)'
+                            '\s+.*?to.*?(?P<op_addr>[0xX0-9a-fA-F]+)'
+                        '|' '\s+[^\s]+' ')+\s*$',
+            re.IGNORECASE)

    # state machine for dwarf line numbers, note that objdump's
    # decodedline seems to have issues with multiple dir/file