[openwrt/openwrt] musl: add pending patch to fix CFI annotations
LEDE Commits
lede-commits at lists.infradead.org
Mon May 5 04:57:20 PDT 2025
nbd pushed a commit to openwrt/openwrt.git, branch main:
https://git.openwrt.org/edd997a9ee2551e45f69dbc97cac70d404a2817b
commit edd997a9ee2551e45f69dbc97cac70d404a2817b
Author: Felix Fietkau <nbd at nbd.name>
AuthorDate: Mon May 5 11:37:14 2025 +0200
musl: add pending patch to fix CFI annotations
Fixes debugging at least on aarch64, possibly others.
Signed-off-by: Felix Fietkau <nbd at nbd.name>
---
...00-tools-Rework-adding-of-CFI-annotations.patch | 1566 ++++++++++++++++++++
1 file changed, 1566 insertions(+)
diff --git a/toolchain/musl/patches/100-tools-Rework-adding-of-CFI-annotations.patch b/toolchain/musl/patches/100-tools-Rework-adding-of-CFI-annotations.patch
new file mode 100644
index 0000000000..de45743caf
--- /dev/null
+++ b/toolchain/musl/patches/100-tools-Rework-adding-of-CFI-annotations.patch
@@ -0,0 +1,1566 @@
+From: =?UTF-8?q?Ignacy=20Gaw=C4=99dzki?=
+ <ignacy.gawedzki at green-communications.fr>
+Date: Thu, 20 Mar 2025 12:07:21 +0100
+Subject: [PATCH] tools: Rework adding of CFI annotations.
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+Rework awk scripts used to add CFI annotations to i386 and x86_64
+assembly, in order to properly maintain CFA offset across in-function
+jumps.
+
+Add arm and aarch64 versions of these scripts.
+
+Signed-off-by: Ignacy Gawędzki <ignacy.gawedzki at green-communications.fr>
+---
+ create mode 100644 tools/add-cfi.aarch64.awk
+ create mode 100644 tools/add-cfi.arm.awk
+
+--- /dev/null
++++ b/tools/add-cfi.aarch64.awk
+@@ -0,0 +1,287 @@
++# Insert GAS CFI directives ("control frame information") into AArch64 asm input.
++#
++# CFI directives tell the assembler how to generate "stack frame" debug info.
++# This information can tell a debugger (like gdb) how to find the current stack
++# frame at any point in the program code, and how to find the values which
++# various registers had at higher points in the call stack.
++# With this information, the debugger can show a backtrace, and you can move up
++# and down the call stack and examine the values of local variables.
++
++BEGIN {
++ # Don't put CFI data in the .eh_frame ELF section (which we don't keep).
++ print ".cfi_sections .debug_frame"
++
++ # Only emit CFI directives inside a function.
++ in_function = ""
++
++ # Emit .loc directives with line numbers from original source.
++ printf ".file 1 \"%s\"\n", ARGV[1]
++ line_number = 0
++ # A label is either a numeric local label or an identifier.
++ re_label = "([0-9]+|[a-zA-Z_][a-zA-Z0-9_]*)"
++
++ # Build an associative array of canonical register names.
++ for (i = 0; i < 30; ++i)
++ regname["x" i] = regname["w" i] = "x" i
++ regname["x30"] = regname["w30"] = regname["lr"] = "x30"
++ regname["xzr"] = regname["wzr"] = "xzr"
++ regname["sp"] = regname["wsp"] = "sp"
++}
++
++{
++ ++line_number
++
++ # Clean the input up before doing anything else.
++ # Delete comments.
++ gsub(/^#.*|\/\/.*|\/\*.*\*\//, "")
++
++ # Canonicalize whitespace.
++ gsub(/[ \t]+/, " ") # Mawk doesn't understand \s.
++ gsub(/ *, */, ",")
++ gsub(/ *: */, ": ")
++ gsub(/ $/, "")
++ gsub(/^ /, "")
++}
++
++# Check for assembler directives which we care about.
++/^\.(section|data|text)/ {
++ # A .cfi_startproc/.cfi_endproc pair should be within the same section
++ # otherwise, clang will choke when generating ELF output.
++ if (in_function) {
++ print ".cfi_endproc"
++ in_function = ""
++ }
++}
++
++# Record each function name.
++/^\.type [a-zA-Z0-9_]+( STT_FUNCTION|,[#@%"]function)/ {
++ functions[substr($2, 1, length($2) - 10)] = 1
++}
++
++# Not interested in assembler directives beyond this, just pass them through.
++/^\./ {
++ print
++ next
++}
++
++# Helper to adjust CFA offset.
++function adjust_sp_offset(delta) {
++ if (in_function) {
++ printf ".cfi_adjust_cfa_offset %d\n", delta
++ cfa_offset[in_function] += delta
++ }
++}
++
++# Helper to invalidate unsaved register.
++function trashed(reg) {
++ if (in_function && !(reg in saved) && !(reg in dirty))
++ printf ".cfi_undefined %s\n", reg
++ dirty[reg] = 1
++}
++
++# Helper to process jumps to labels by saving the current CFA offset.
++function jump_to_label(label) {
++ if (in_function) {
++ if (match(label, /^[0-9]+f$/)) # "forward" label
++ cfa_offset[substr(label, 1, RLENGTH - 1)] = cfa_offset[in_function]
++ else if (match(label, /^[a-zA-Z_][a-zA-Z0-9_]*$/))
++ cfa_offset[label] = cfa_offset[in_function]
++ }
++}
++
++# Helper to set relative offset of registers pushed on the stack.
++function push_regs(regs, numregs, i) {
++ adjust_sp_offset(numregs * 4)
++ for (i = 1; i <= numregs; ++i) {
++ reg = regname[regs[i]]
++ if (!(reg in saved) && !(reg in dirty)) {
++ printf ".cfi_rel_offset %s,%i\n", reg, ((i - 1) * 4)
++ saved[reg] = 1
++ }
++ }
++}
++
++# Helper to invalidate unsaved registers popped from the stack.
++function pop_regs(regs, numregs, i) {
++ adjust_sp_offset(numregs * -4)
++ for (i = 1; i <= numregs; ++i) {
++ reg = regname[regs[i]]
++ trashed(reg)
++ }
++}
++
++# Helper to save a single register saved in SP-relative locations.
++function save_reg(reg, offset) {
++ reg = regname[reg]
++ if (!(reg in saved) && !(reg in dirty)) {
++ printf ".cfi_rel_offset %s,%d\n", reg, offset
++ saved[reg] = 1
++ }
++}
++
++# Process labels.
++$0 ~ "^" re_label ":" {
++ # Parse each leading label.
++ while (match($0, "^" re_label ":")) {
++
++ # Extract label name.
++ label = substr($1, 1, RLENGTH - 1)
++
++ # Remove label from current line.
++ sub("^" re_label ": ?", "")
++
++ if (label in functions) {
++ if (in_function) {
++ print ".cfi_endproc"
++ for (l in called)
++ delete called[l]
++ }
++
++ in_function = label
++ print ".cfi_startproc"
++
++ for (reg in saved)
++ delete saved[reg]
++ for (reg in dirty)
++ delete dirty[reg]
++ }
++
++ printf "%s:\n", label
++
++ # If this label has been jumped to, define the CFA offset to its
++ # value at the location of the jump.
++ if (!(label in functions) && in_function && label in cfa_offset) {
++ if (cfa_offset[in_function] != cfa_offset[label]) {
++ printf ".cfi_def_cfa_offset %d\n", cfa_offset[label]
++ cfa_offset[in_function] = cfa_offset[label]
++ }
++ delete cfa_offset[label]
++ }
++
++ # If this label has been called, invalidate LR (canonical name) unless saved.
++ if (label in called && !(label in functions)) {
++ trashed(regname["lr"])
++ delete called[label]
++ }
++ }
++ # An instruction may follow on the same line, so continue processing.
++}
++
++# Skip empty line.
++/^$/ { next }
++
++# Issue source line number.
++{
++ printf ".loc 1 %d\n", line_number
++ print
++}
++
++# Process jumps to label (using B*).
++/^b[^xrl]/ {
++ jump_to_label($2)
++}
++
++# Process jumps to label (using [CT]BN?Z).
++/^[ct]bn?z / {
++ if (match($2, /,.+$/))
++ jump_to_label(substr($2, RSTART + 1, RLENGTH - 1))
++}
++
++# Issue relative offsets of registers stored in SP-relative locations.
++/^st(n?p|r[bh]?|l[lu]?r|tr|ur) .+,\[(sp|x30)[,\]]/ {
++ if (in_function) {
++ if (match($2, /(,#?[+-]?(0x[0-9a-fA-F]+|[0-9]+))?\]$/)) {
++ # Offset with no write-back.
++ if (RLENGTH == 1)
++ offset = 0
++ else
++ offset = parse_const(substr($2, RSTART + 2, RLENGTH - 3))
++ split($2, operands, ",")
++ if (match($1, /^stn?p$/)) {
++ if (match(operands[1], /^x/)) {
++ save_reg(operands[1], offset)
++ save_reg(operands[2], offset + 8)
++ }
++ } else if (match(operands[1], /^x/))
++ save_reg(operands[1], offset)
++ } else if (match($2, /,#?[+-]?(0x[0-9a-fA-F]+|[0-9]+)\]!$/)) {
++ # Pre-index with write-back.
++ offset = parse_const(substr($2, RSTART + 2, RLENGTH - 4))
++ adjust_sp_offset(-offset)
++ split($2, operands, ",")
++ if ($1 == "stp") {
++ if (match(operands[1], /^x/)) {
++ save_reg(operands[1], 0)
++ save_reg(operands[2], 8)
++ }
++ } else if (match(operands[1], /^x/))
++ save_reg(operands[1], 0)
++ } else if (match($2, /,#?[+-]?(0x[0-9a-fA-F]+|[0-9]+)$/)) {
++ # Post-index
++ offset = parse_const(substr($2, RSTART + 2, RLENGTH - 2))
++ split($2, operands, ",")
++ if ($1 == "stp") {
++ if (match(operands[1], /^x/)) {
++ save_reg(operands[1], 0)
++ save_reg(operands[2], 8)
++ }
++ } else if (match(operands[1], /^x/))
++ save_reg(operands[1], 0)
++ adjust_sp_offset(-offset)
++ }
++ }
++}
++
++# Adjust CFA offset when decreasing SP.
++/subs?(\.[nw])? sp,sp,/ {
++ if (in_function && match($2, /,#[+-]?(0x[0-9a-fA-F]+|[0-9]+)$/))
++ adjust_sp_offset(parse_const(substr($2, RSTART + 2, RLENGTH - 2)))
++}
++
++# Adjust CFA offset when increasing SP.
++/adds?(\.[nw])? sp,sp,/ {
++ if (in_function && match($2, /,#[+-]?(0x[0-9a-fA-F]+|[0-9]+)$/))
++ adjust_sp_offset(-parse_const(substr($2, RSTART + 2, RLENGTH - 2)))
++}
++
++# Process calls to labels.
++/bl[a-z]* / {
++ if (match($2, /^[0-9]+f$/)) # "forward" label
++ called[substr($2, 1, RLENGTH - 1)] = 1
++ else if (match($2, /^[a-zA-Z_][0-9a-zA-Z_]*$/))
++ called[$2] = 1
++}
++
++# Invalidate unsaved registers being written to.
++/^(adcs?|adds?|adrp?|ands?|asrv?|bfc|bfi|bfm|bfxil|bics?|cin[cv]|cl[sz]|cneg|crc32[a-z]+|csel|csetm?|csin[cv]|csneg|eo[nr]|extr|ldap(r[bh]?|ur(s?[bhw]?))|ldar[bh]?|ldax[pr][bh]?|ldlar[bh]?|ldr((aa)?|s?[bhw])|ldtrs?[bhw]?|ldurs?[bhw]?|ldxr[bh]?|ls[lr]v?|madd|mneg|mov[knz]?|mrs|msub|mul|mvn|negs?|ngcs?|orn|orr|pac[a-z0-9]+|rbit|rev(16|32)?|rorv?|sbcs?|sbfiz|sbfm|sbfx|sdiv|smaddl|smnegl|smsubl|smul[hl]|subs?|sxt[bhw]|sysl|ubfiz|ubfm|ubfx|udiv|umaddl|umnegl|umsubl|umul[hl]|uxt[bhw]) ([xw]([ [...]
++ split($2, args, ",")
++ reg = args[1]
++ if (reg != "sp")
++ trashed(regname[reg])
++}
++
++# Invalidate unsaved registers being written to by atomic operations in memory.
++/^ld(add|clr|eor|set|[su](max|min))/ {
++ split($2, args, ",")
++ trashed(regname[args[2]])
++}
++
++# Invalidate unsaved registers being written to by pair loading.
++/^ld[nx]p(sw)? / {
++ split($2, args, ",")
++ trashed(regname[args[1]])
++ trashed(regname[args[2]])
++}
++
++# Invalidate unsaved registers being written to by long instructions.
++/^(smlals?|smlal(bb|bt|tb|tt)|smlaldx?|smlsldx?|smull|umaal|umlal|umulls?) / {
++ split($2, args, ",")
++ trashed(regname[args[1]])
++ trashed(regname[args[2]])
++}
++
++END {
++ # Issue end of function if still inside one.
++ if (in_function)
++ print ".cfi_endproc"
++}
+--- /dev/null
++++ b/tools/add-cfi.arm.awk
+@@ -0,0 +1,367 @@
++# Insert GAS CFI directives ("control frame information") into ARM asm input.
++#
++# CFI directives tell the assembler how to generate "stack frame" debug info.
++# This information can tell a debugger (like gdb) how to find the current stack
++# frame at any point in the program code, and how to find the values which
++# various registers had at higher points in the call stack.
++# With this information, the debugger can show a backtrace, and you can move up
++# and down the call stack and examine the values of local variables.
++
++BEGIN {
++ # Don't put CFI data in the .eh_frame ELF section (which we don't keep).
++ print ".cfi_sections .debug_frame"
++
++ # Only emit CFI directives inside a function.
++ in_function = ""
++
++ # Emit .loc directives with line numbers from original source.
++ printf ".file 1 \"%s\"\n", ARGV[1]
++ line_number = 0
++ # A label is either a numeric local label or an identifier.
++ re_label = "([0-9]+|[a-zA-Z_][a-zA-Z0-9_]*)"
++
++ # Build an associative array of canonical register names.
++ for (i = 0; i < 10; ++i) {
++ regname["r" i] = "r" i
++ regnum["r" i] = i
++ }
++ regname["r10"] = regname["sl"] = "r10"
++ regnum["r10"] = regnum["sl"] = 10
++ regname["r11"] = regname["fp"] = "r11"
++ regnum["r11"] = regnum["fp"] = 11
++ regname["r12"] = regname["ip"] = "r12"
++ regnum["r12"] = regnum["ip"] = 12
++ regname["r13"] = regname["sp"] = "r13"
++ regnum["r13"] = regnum["sp"] = 13
++ regname["r14"] = regname["lr"] = "r14"
++ regnum["r14"] = regnum["lr"] = 14
++ regname["r15"] = regname["pc"] = "r15"
++ regnum["r15"] = regnum["pc"] = 15
++}
++
++{
++ ++line_number
++
++ # Clean the input up before doing anything else.
++ # Delete comments.
++ gsub(/(^#|@|\/\/).*|\/\*.*\*\//, "")
++
++ # Canonicalize whitespace.
++ gsub(/[ \t]+/, " ") # Mawk doesn't understand \s.
++ gsub(/ *, */, ",")
++ gsub(/ *: */, ": ")
++ gsub(/ $/, "")
++ gsub(/^ /, "")
++}
++
++# Check for assembler directives which we care about.
++/^\.(section|data|text)/ {
++ # A .cfi_startproc/.cfi_endproc pair should be within the same section
++ # otherwise, clang will choke when generating ELF output.
++ if (in_function) {
++ print ".cfi_endproc"
++ in_function = ""
++ }
++}
++
++# Record each function name.
++/^\.type [a-zA-Z0-9_]+( STT_FUNCTION|,[#@%"]function)/ {
++ functions[substr($2, 1, length($2) - 10)] = 1
++}
++
++# Not interested in assembler directives beyond this, just pass them through.
++/^\./ {
++ print
++ next
++}
++
++# Helper to adjust CFA offset.
++function adjust_sp_offset(delta) {
++ if (in_function) {
++ printf ".cfi_adjust_cfa_offset %d\n", delta
++ cfa_offset[in_function] += delta
++ }
++}
++
++# Helper to invalidate unsaved register.
++function trashed(reg) {
++ if (in_function && !(reg in saved) && !(reg in dirty))
++ printf ".cfi_undefined %s\n", reg
++ dirty[reg] = 1
++}
++
++# Helper to process jumps to labels by saving the current CFA offset.
++function jump_to_label(label) {
++ if (in_function) {
++ if (match(label, /^[0-9]+f$/)) # "forward" label
++ cfa_offset[substr(label, 1, RLENGTH - 1)] = cfa_offset[in_function]
++ else if (match(label, /^[a-zA-Z_][a-zA-Z0-9_]*$/))
++ cfa_offset[label] = cfa_offset[in_function]
++ }
++}
++
++# Helper to save a single register saved in SP-relative locations.
++function save_reg(reg, offset) {
++ reg = regname[reg]
++ if (!(reg in saved) && !(reg in dirty)) {
++ printf ".cfi_rel_offset %s,%d\n", reg, offset
++ saved[reg] = 1
++ }
++}
++
++# Helper to save registers relative to SP.
++function save_regs(regs, numregs, i) {
++ for (i = 1; i <= numregs; ++i)
++ save_reg(regname[regs[i]], (i - 1) * -4)
++}
++
++# Helper to set relative offset of registers pushed on the stack.
++function push_regs(regs, numregs, i) {
++ adjust_sp_offset(numregs * 4)
++ for (i = 1; i <= numregs; ++i)
++ save_reg(regname[regs[i]], (i - 1) * 4)
++}
++
++# Helper to invalidate unsaved registers popped from the stack.
++function pop_regs(regs, numregs, i) {
++ adjust_sp_offset(numregs * -4)
++ for (i = 1; i <= numregs; ++i) {
++ reg = regname[regs[i]]
++ trashed(reg)
++ }
++}
++
++# Helper to parse register lists.
++function split_reglist(arg, regs, num, toks, tmp, dash, i, j) {
++ while (match(arg, /^{[^}]+}/)) {
++ num = split(substr(arg, RSTART + 1, RLENGTH - 2), toks, ",")
++ for (i = 1; i <= num; ++i)
++ if (match(toks[i], /^r([0-9]|1[0-5])-r([0-9]|1[0-5])$/)) {
++ dash = index(toks[i], "-")
++ first = 0 + substr(toks[i], 2, dash - 2)
++ last = 0 + substr(toks[i], dash + 2)
++ for (j = first; j <= last; ++j)
++ tmp[j]
++ } else
++ tmp[regnum[toks[i]]]
++ arg = substr(arg, RSTART + RLENGTH)
++ if (!match(arg, /^[\t ]*[+|][\t ]*/))
++ break
++ arg = substr(arg, RLENGTH + 1)
++ }
++ num = 0
++ for (i = 0; i < 16; ++i) {
++ if (!(i in tmp))
++ continue
++ regs[++num] = regname["r" i]
++ }
++ return num
++}
++
++# Process labels.
++$0 ~ "^" re_label ":" {
++ # Parse each leading label.
++ while (match($0, "^" re_label ":")) {
++
++ # Extract label name.
++ label = substr($1, 1, RLENGTH - 1)
++
++ # Remove label from current line.
++ sub("^" re_label ": ?", "")
++
++ if (label in functions) {
++ if (in_function) {
++ print ".cfi_endproc"
++ for (l in called)
++ delete called[l]
++ }
++
++ in_function = label
++ print ".cfi_startproc"
++
++ for (reg in saved)
++ delete saved[reg]
++ for (reg in dirty)
++ delete dirty[reg]
++ }
++
++ printf "%s:\n", label
++
++ # If this label has been jumped to, define the CFA offset to its
++ # value at the location of the jump.
++ if (!(label in functions) && in_function && label in cfa_offset) {
++ if (cfa_offset[in_function] != cfa_offset[label]) {
++ printf ".cfi_def_cfa_offset %d\n", cfa_offset[label]
++ cfa_offset[in_function] = cfa_offset[label]
++ }
++ delete cfa_offset[label]
++ }
++
++ # If this label has been called, invalidate LR (canonical name) unless saved.
++ if (label in called && !(label in functions)) {
++ trashed(regname["lr"])
++ delete called[label]
++ }
++ }
++ # An instruction may follow on the same line, so continue processing.
++}
++
++# Skip empty line.
++/^$/ { next }
++
++# Issue source line number.
++{
++ printf ".loc 1 %d\n", line_number
++ print
++}
++
++# Process jumps to label (using B*).
++/^b[^xl]/ {
++ jump_to_label($2)
++}
++
++# Process jumps to label (using CBNZ?).
++/^cbnz? / {
++ if (match($2, /,.*$/))
++ jump_to_label(substr($2, RSTART + 1, RLENGTH - 1))
++}
++
++# Adjust CFA offset and issue relative offsets of pushed registers using PUSH.
++/^push / {
++ if (in_function) {
++ numregs = split_reglist($2, regs)
++ push_regs(regs, numregs);
++ }
++}
++
++# Adjust CFA offset and Issue relative offsets of pushed registers using STMFD.
++/^stm(fd|db)(al)?(\.[nw])? (sp|r13)!,/ {
++ if (in_function) {
++ numregs = split_reglist(substr($2, index($2, ",") + 1), regs)
++ push_regs(regs, numregs);
++ }
++}
++
++/^stm(ia|ea)?(al)?(\.[nw])? (sp|r13),/ {
++ if (in_function) {
++ numregs = split_reglist(substr($2, index($2, ",") + 1), regs)
++ save_regs(regs, numregs);
++ }
++}
++
++# Adjust CFA offset and invalidate unsaved registers popped using POP.
++/^pop / {
++ if (in_function) {
++ numregs = split_reglist($2, regs)
++ pop_regs(regs, numregs)
++ }
++}
++
++# Adjust CFA offset and invalidate unsaved registers popped using LDMFD.
++/^ldm(fd|ia)(al)?(\.[nw])? (sp|r13)!,/ {
++ if (in_function) {
++ numregs = split_reglist(substr($2, index($2, ",") + 1), regs)
++ pop_regs(regs, numregs)
++ }
++}
++
++# Issue relative offsets of registers stored in SP-relative locations.
++/^str[a-z.]* .*,\[(sp|r13)[,\]]/ {
++ if (in_function && !match($1, /^str(ex)?[bh]/)) {
++ if (match($2, /(,#[+-]?(0x[0-9a-fA-F]+|[0-9]+))?\]$/)) {
++ # Offset with no write-back.
++ if (RLENGTH == 1)
++ offset = 0
++ else
++ offset = parse_const(substr($2, RSTART + 2, RLENGTH - 3))
++ split($2, operands, ",")
++ if (match($1, /^str(ex)?d/)) {
++ save_reg(operands[1], offset)
++ save_reg(operands[2], offset + 4)
++ } else
++ save_reg(operands[1], offset)
++ } else if (match($2, /,#[+-]?(0x[0-9a-fA-F]+|[0-9]+)\]!$/)) {
++ # Pre-index with write-back.
++ offset = parse_const(substr($2, RSTART + 2, RLENGTH - 4))
++ adjust_sp_offset(-offset)
++ split($2, operands, ",")
++ if (match($1, /^str(ex)?d/)) {
++ save_reg(operands[1], 0)
++ save_reg(operands[2], 4)
++ } else
++ save_reg(operands[1], 0)
++ } else if (match($2, /,#[+-]?(0x[0-9a-fA-F]+|[0-9]+)$/)) {
++ # Post-index
++ offset = parse_const(substr($2, RSTART + 2, RLENGTH - 2))
++ split($2, operands, ",")
++ if (match($1, /^str(ex)?d/)) {
++ save_reg(operands[1], 0)
++ save_reg(operands[2], 4)
++ } else
++ save_reg(operands[1], 0)
++ adjust_sp_offset(-offset)
++ }
++ }
++}
++
++# Adjust CFA offset when decreasing SP.
++/subs?(al)?(\.[nw])? (sp|r13),(sp|r13),/ {
++ if (in_function && match($2, /,#[+-]?(0x[0-9a-fA-F]+|[0-9]+)$/))
++ adjust_sp_offset(parse_const(substr($2, RSTART + 2, RLENGTH - 2)))
++}
++
++# Adjust CFA offset when increasing SP.
++/adds?(al)?(\.[nw])? (sp|r13),(sp|r13),/ {
++ if (in_function && match($2, /,#[+-]?(0x[0-9a-fA-F]+|[0-9]+)$/))
++ adjust_sp_offset(-parse_const(substr($2, RSTART + 2, RLENGTH - 2)))
++}
++
++# Process calls to labels.
++/bl[a-z]* / {
++ if (match($2, /^[0-9]+f$/)) # "forward" label
++ called[substr($2, 1, RLENGTH - 1)] = 1
++ else if (match($2, /^[a-zA-Z_][0-9a-zA-Z_]*$/))
++ called[$2] = 1
++}
++
++# Invalidate unsaved registers being written to.
++/^((adc|add|and|asr|adr|bic|eor|lsl|lsr|mla|mov|mul|mvn|orn|orr|ror|rrx|rsb|rsc|sbc|sub)s?|bfc|bfi|clz|cpy|ldr[a-z]*|mls||movt|mrs|neg|pkh(bt|tb)|qadd(8|16)?|qasx|qdadd|qdsub|qsax|qsub(8|16)?|rbit|rev(16)?|revsh|sadd(16|8)|sasx|sbfx|sdiv|sel|shadd(16|8)|shasx|shsax|shsub(16|8)|smla(bb|bt|tb|tt)|smladx?|smlaw[tb]|smlsdx?|smmlar?|smlsr?|smmulr?|smuadx?|smul(bb|bt|tb|tt)|smulw[bt]|smusdx?|ssat(16)?|ssax|ssub(16|8)|swpb?|sxtab(16)?|sxtah|sxtb(16)?|sxth|sxtb(16)?|sxth|uadd(16|8)|uasx|ubfx|ud [...]
++ split($2, args, ",")
++ reg = args[1]
++ if (reg != "sp")
++ trashed(regname[reg])
++}
++
++# Invalidate unsaved registers being written to by long instructions.
++/^(smlals?|smlal(bb|bt|tb|tt)|smlaldx?|smlsldx?|smull|umaal|umlal|umulls?)/ {
++ split($2, args, ",")
++ trashed(regname[args[1]])
++ trashed(regname[args[2]])
++}
++
++# Invalidate unsaved register being modified by write-back on store multiple.
++/^stm[a-z.]* [^,]+!,/ {
++ first_arg = substr($2, 1, index($2, ",") - 1)
++ if (!match(first_arg, /^(sp|r13)/))
++ trashed(regname[substr(first_arg, 1, length(first_arg) - 1)])
++}
++
++# Invalidate unsaved registers being modified by load multiple.
++/^ldm[a-z.]* [^,]+,{.*}$/ {
++ comma = index($2, ",")
++ first_arg = substr($2, 1, comma - 1)
++ other_args = substr($2, comma + 1)
++ if (!match(first_arg, /^(sp|r13)/)) {
++ if (match(first_arg, /!$/))
++ trashed(regname[substr(first_arg, 1, RSTART - 1)])
++ numregs = split_reglist(other_args, regs)
++ for (i = 1; i <= numregs; ++i)
++ trashed(regname[regs[i]])
++ }
++}
++
++END {
++ # Issue end of function if still inside one.
++ if (in_function)
++ print ".cfi_endproc"
++}
+--- a/tools/add-cfi.common.awk
++++ b/tools/add-cfi.common.awk
+@@ -1,26 +1,46 @@
+-function hex2int(str, i) {
++function hex2int(str, i) {
+ str = tolower(str)
+
+ for (i = 1; i <= 16; i++) {
+ char = substr("0123456789abcdef", i, 1)
+- lookup[char] = i-1
++ lookup[char] = i - 1
+ }
+
+ result = 0
+ for (i = 1; i <= length(str); i++) {
+- result = result * 16
+- char = substr(str, i, 1)
+- result = result + lookup[char]
++ result *= 16
++ char = substr(str, i, 1)
++ result += lookup[char]
++ }
++ return result
++}
++
++function oct2int(str, i) {
++ str = tolower(str)
++
++ for (i = 1; i <= 8; ++i) {
++ char = substr("01234567", i, 1)
++ lookup[char] = i - 1
++ }
++
++ result = 0
++ for (i = 1; i <= length(str); ++i) {
++ result *= 8
++ char = substr(str, i, 1)
++ result += lookup[char]
+ }
+ return result
+ }
+
+ function parse_const(str) {
+- sign = sub(/^-/, "", str)
+- hex = sub(/^0x/, "", str)
++ neg = sub(/^-/, "", str)
++ oct = match(str, /^0[0-7]/)
++ hex = sub(/^0x/, "", str)
+ if (hex)
+ n = hex2int(str)
++ else if (oct)
++ n = oct2int(str)
+ else
+ n = str+0
+- return sign ? -n : n
++ return neg? -n: n
+ }
+--- a/tools/add-cfi.i386.awk
++++ b/tools/add-cfi.i386.awk
+@@ -1,123 +1,179 @@
+-# Insert GAS CFI directives ("control frame information") into x86-32 asm input
++# Insert GAS CFI directives ("control frame information") into x86-32 asm input.
+ #
+-# CFI directives tell the assembler how to generate "stack frame" debug info
++# CFI directives tell the assembler how to generate "stack frame" debug info.
+ # This information can tell a debugger (like gdb) how to find the current stack
+ # frame at any point in the program code, and how to find the values which
+-# various registers had at higher points in the call stack
++# various registers had at higher points in the call stack.
+ # With this information, the debugger can show a backtrace, and you can move up
+-# and down the call stack and examine the values of local variables
++# and down the call stack and examine the values of local variables.
+
+ BEGIN {
+- # don't put CFI data in the .eh_frame ELF section (which we don't keep)
++ # Don't put CFI data in the .eh_frame ELF section (which we don't keep).
+ print ".cfi_sections .debug_frame"
+
+- # only emit CFI directives inside a function
+- in_function = 0
++ # Only emit CFI directives inside a function.
++ in_function = ""
+
+- # emit .loc directives with line numbers from original source
++ # Emit .loc directives with line numbers from original source.
+ printf ".file 1 \"%s\"\n", ARGV[1]
+ line_number = 0
+
+- # used to detect "call label; label:" trick
+- called = ""
++ re_label = "([0-9]+|[a-zA-Z_][a-zA-Z0-9_]*)"
++
++ for (i = 1; i <= 4; ++i) {
++ letter = substr("abcd", i, 1)
++ regname[letter "l"] = regname[letter "h"] = regname[letter "x"] = \
++ regname["e" letter "x"] = "e" letter "x"
++ }
++
++ regname["si"] = regname["esi"] = "esi"
++ regname["di"] = regname["edi"] = "edi"
++ regname["bp"] = regname["ebp"] = "ebp"
++ regname["sp"] = regname["esp"] = "esp"
+ }
+
++# For instructions with 2 operands, get 1st operand (assuming it is constant).
+ function get_const1() {
+- # for instructions with 2 operands, get 1st operand (assuming it is constant)
+- match($0, /-?(0x[0-9a-fA-F]+|[0-9]+),/)
+- return parse_const(substr($0, RSTART, RLENGTH-1))
++ match($2, /^\$[+-]?(0x[0-9a-fA-F]+|[0-9]+),/)
++ return parse_const(substr($2, 2, RLENGTH - 2))
+ }
+
+-function canonicalize_reg(register) {
+- if (match(register, /^e/))
+- return register
+- else if (match(register, /[hl]$/)) # AH, AL, BH, BL, etc
+- return "e" substr(register, 1, 1) "x"
+- else # AX, BX, CX, etc
+- return "e" register
+-}
++# Only use if you already know there is 1 and only 1 register.
+ function get_reg() {
+- # only use if you already know there is 1 and only 1 register
+- match($0, /%e?([abcd][hlx]|si|di|bp)/)
+- return canonicalize_reg(substr($0, RSTART+1, RLENGTH-1))
++ return regname[substr($2, 2, length($2) - 1)]
+ }
++
++# For instructions with 2 operands, get 1st operand (assuming it is register).
+ function get_reg1() {
+- # for instructions with 2 operands, get 1st operand (assuming it is register)
+- match($0, /%e?([abcd][hlx]|si|di|bp),/)
+- return canonicalize_reg(substr($0, RSTART+1, RLENGTH-2))
++ match($2, /^%e?([abcd][hlx]|si|di|bp),/)
++ return regname[substr($2, 2, RLENGTH - 2)]
+ }
++
++# For instructions with 2 operands, get 2nd operand (assuming it is register).
+ function get_reg2() {
+- # for instructions with 2 operands, get 2nd operand (assuming it is register)
+- match($0, /,%e?([abcd][hlx]|si|di|bp)/)
+- return canonicalize_reg(substr($0, RSTART+2, RLENGTH-2))
++ match($2, /,%e?([abcd][hlx]|si|di|bp)$/)
++ return regname[substr($2, RSTART + 2, RLENGTH - 2)]
+ }
+
++# Helper to adjust CFA offset.
+ function adjust_sp_offset(delta) {
+- if (in_function)
++ if (in_function) {
+ printf ".cfi_adjust_cfa_offset %d\n", delta
++ cfa_offset[in_function] += delta
++ }
++}
++
++function save_reg(reg, offset) {
++ if (!(reg in saved) && !(reg in dirty)) {
++ printf ".cfi_rel_offset %s,%d\n", reg, offset
++ saved[reg] = 1
++ }
++}
++
++# Helper to process jumps to labels by saving the current CFA offset.
++function jump_to_label(label) {
++ if (in_function) {
++ if (match(label, /^[0-9]+f$/)) # "forward" label
++ cfa_offset[substr(label, 1, RLENGTH - 1)] = cfa_offset[in_function]
++ else if (match(label, /^[a-zA-Z_][a-zA-Z0-9_]*$/))
++ cfa_offset[label] = cfa_offset[in_function]
++ }
+ }
+
+ {
+- line_number = line_number + 1
++ ++line_number
+
+- # clean the input up before doing anything else
+- # delete comments
+- gsub(/(#|\/\/).*/, "")
++ # Clean the input up before doing anything else.
++ # Delete comments.
++ gsub(/#.*|\/\*.*\*\//, "")
+
+- # canonicalize whitespace
+- gsub(/[ \t]+/, " ") # mawk doesn't understand \s
++ # Canonicalize whitespace.
++ gsub(/[ \t]+/, " ") # Mawk doesn't understand \s.
+ gsub(/ *, */, ",")
+ gsub(/ *: */, ": ")
++ gsub(/%cs: */, "%cs:")
++ gsub(/%ds: */, "%ds:")
++ gsub(/%ss: */, "%ss:")
++ gsub(/%es: */, "%es:")
++ gsub(/%fs: */, "%fs:")
++ gsub(/%gs: */, "%gs:")
+ gsub(/ $/, "")
+ gsub(/^ /, "")
+ }
+
+-# check for assembler directives which we care about
++# Check for assembler directives which we care about.
+ /^\.(section|data|text)/ {
+- # a .cfi_startproc/.cfi_endproc pair should be within the same section
+- # otherwise, clang will choke when generating ELF output
++ # A .cfi_startproc/.cfi_endproc pair should be within the same section.
++ # Otherwise, clang will choke when generating ELF output.
+ if (in_function) {
+ print ".cfi_endproc"
+- in_function = 0
++ in_function = ""
+ }
+ }
+-/^\.type [a-zA-Z0-9_]+, at function/ {
+- functions[substr($2, 1, length($2)-10)] = 1
++
++# Record each function name.
++/^\.type [a-zA-Z0-9_]+( STT_FUNCTION|,[#@%"]function)/ {
++ functions[substr($2, 1, length($2) - 10)] = 1
+ }
+-# not interested in assembler directives beyond this, just pass them through
++
++# Not interested in assembler directives beyond this, just pass them through.
+ /^\./ {
+ print
+ next
+ }
+
+-/^[a-zA-Z0-9_]+:/ {
+- label = substr($1, 1, length($1)-1) # drop trailing :
+-
+- if (called == label) {
+- # note adjustment of stack pointer from "call label; label:"
+- adjust_sp_offset(4)
+- }
++$0 ~ "^" re_label ":" {
++ # Parse each leading label.
++ while (match($0, "^" re_label ":")) {
++
++ # Extract label name.
++ label = substr($1, 1, RLENGTH - 1)
++
++ # Remove label from current line.
++ sub("^" re_label ": ?", "")
++
++ if (label in functions) {
++ if (in_function) {
++ print ".cfi_endproc"
++ for (l in called)
++ delete called[l]
++ }
++
++ in_function = label
++ print ".cfi_startproc"
++
++ for (reg in saved)
++ delete saved[reg]
++ for (reg in dirty)
++ delete dirty[reg]
++ }
+
+- if (functions[label]) {
+- if (in_function)
+- print ".cfi_endproc"
++ printf "%s:\n", label
+
+- in_function = 1
+- print ".cfi_startproc"
++ # If this label has been jumped to, define the CFA offset to its
++ # value at the location of the jump.
++ if (!(label in functions) && in_function && label in cfa_offset) {
++ if (cfa_offset[in_function] != cfa_offset[label]) {
++ printf ".cfi_def_cfa_offset %d\n", cfa_offset[label]
++ cfa_offset[in_function] = cfa_offset[label]
++ }
++ delete cfa_offset[label]
++ }
+
+- for (register in saved)
+- delete saved[register]
+- for (register in dirty)
+- delete dirty[register]
++ # If this label has been called, adjust CFA offset.
++ if (label in called && !(label in functions)) {
++ adjust_sp_offset(4);
++ delete called[label]
++ }
+ }
+-
+- # an instruction may follow on the same line, so continue processing
++ # An instruction may follow on the same line, so continue processing.
+ }
+
++# Skip empty line.
+ /^$/ { next }
+
++# Issue source line number.
+ {
+- called = ""
+ printf ".loc 1 %d\n", line_number
+ print
+ }
+@@ -126,82 +182,145 @@ function adjust_sp_offset(delta) {
+ # We do NOT attempt to understand foolish and ridiculous tricks like stashing
+ # the stack pointer and then using %esp as a scratch register, or bitshifting
+ # it or taking its square root or anything stupid like that.
+-# %esp should only be adjusted by pushing/popping or adding/subtracting constants
++# %esp should only be adjusted by pushing/popping or adding/subtracting
++# constants.
+ #
+-/pushl?/ {
+- if (match($0, / %(ax|bx|cx|dx|di|si|bp|sp)/))
++/^push[wl]? / {
++ if ($1 == "pushw" || match($2, /^%([abcd]x|di|si|bp|sp)$/))
+ adjust_sp_offset(2)
+ else
+ adjust_sp_offset(4)
+ }
+-/popl?/ {
+- if (match($0, / %(ax|bx|cx|dx|di|si|bp|sp)/))
++
++/^pop[wl]? / {
++ if ($1 == "popw" || match($2, /^%([abcd]x|di|si|bp|sp)$/))
+ adjust_sp_offset(-2)
+ else
+ adjust_sp_offset(-4)
+ }
+-/addl? \$-?(0x[0-9a-fA-F]+|[0-9]+),%esp/ { adjust_sp_offset(-get_const1()) }
+-/subl? \$-?(0x[0-9a-fA-F]+|[0-9]+),%esp/ { adjust_sp_offset(get_const1()) }
+
+-/call/ {
+- if (match($0, /call [0-9]+f/)) # "forward" label
+- called = substr($0, RSTART+5, RLENGTH-6)
+- else if (match($0, /call [0-9a-zA-Z_]+/))
+- called = substr($0, RSTART+5, RLENGTH-5)
++/^pushal?$/ {
++ adjust_sp_offset(32)
++ if (in_function) {
++ save_reg("eax", 28)
++ save_reg("ecx", 24)
++ save_reg("edx", 20)
++ save_reg("ebx", 16)
++ save_reg("esp", 12)
++ save_reg("ebp", 8)
++ save_reg("esi", 4)
++ save_reg("edi", 0)
++ }
++}
++
++/^pushaw$/ {
++ adjust_sp_offset(16)
++}
++
++/^popal?$/ {
++ adjust_sp_offset(-32)
++}
++
++/^popaw$/ {
++ adjust_sp_offset(-16)
++}
++
++/^pushfl?$/ {
++ adjust_sp_offset(4)
++}
++
++/^pushfw$/ {
++ adjust_sp_offset(2)
++}
++
++/^popfl?$/ {
++ adjust_sp_offset(-4)
++}
++
++/^popfw$/ {
++ adjust_sp_offset(-2)
++}
++
++/^addl? \$[+-]?(0x[0-9a-fA-F]+|[0-9]+),%esp/ {
++ adjust_sp_offset(-get_const1())
++}
++
++/^subl? \$[+-]?(0x[0-9a-fA-F]+|[0-9]+),%esp/ {
++ adjust_sp_offset(get_const1())
++}
++
++/^call / {
++ if (match($2, /^[0-9]+f$/)) # "forward" label
++ called[substr($2, 1, RLENGTH - 1)] = 1
++ else if (match($2, /^[a-zA-Z_][0-9a-zA-Z_]*$/))
++ called[$2] = 1
++}
++
++/^j/ {
++ jump_to_label($2)
+ }
+
+ # TRACKING REGISTER VALUES FROM THE PREVIOUS STACK FRAME
+ #
+-/pushl? %e(ax|bx|cx|dx|si|di|bp)/ { # don't match "push (%reg)"
+- # if a register is being pushed, and its value has not changed since the
++/^pushl? %e([abcd]x|si|di|bp)$/ {
++ # Don't match "push (%reg)"
++ # If a register is being pushed, and its value has not changed since the
+ # beginning of this function, the pushed value can be used when printing
+- # local variables at the next level up the stack
+- # emit '.cfi_rel_offset' for that
++ # local variables at the next level up the stack.
++ # Emit '.cfi_rel_offset' for that.
+
+- if (in_function) {
+- register = get_reg()
+- if (!saved[register] && !dirty[register]) {
+- printf ".cfi_rel_offset %s,0\n", register
+- saved[register] = 1
+- }
+- }
++ if (in_function)
++ save_reg(get_reg(), 0)
+ }
+
+-/movl? %e(ax|bx|cx|dx|si|di|bp),-?(0x[0-9a-fA-F]+|[0-9]+)?\(%esp\)/ {
++/^movl? %e(ax|bx|cx|dx|si|di|bp),[+-]?(0x[0-9a-fA-F]+|[0-9]+)?\(%esp\)$/ {
+ if (in_function) {
+- register = get_reg()
+- if (match($0, /-?(0x[0-9a-fA-F]+|[0-9]+)\(%esp\)/)) {
+- offset = parse_const(substr($0, RSTART, RLENGTH-6))
++ if (match($2, /,[+-]?(0x[0-9a-fA-F]+|[0-9]+)\(%esp\)$/)) {
++ offset = parse_const(substr($2, RSTART + 1, RLENGTH - 7))
+ } else {
+ offset = 0
+ }
+- if (!saved[register] && !dirty[register]) {
+- printf ".cfi_rel_offset %s,%d\n", register, offset
+- saved[register] = 1
+- }
++ save_reg(get_reg1(), offset)
+ }
+ }
+
+ # IF REGISTER VALUES ARE UNCEREMONIOUSLY TRASHED
+ # ...then we want to know about it.
+ #
+-function trashed(register) {
+- if (in_function && !saved[register] && !dirty[register]) {
+- printf ".cfi_undefined %s\n", register
+- }
+- dirty[register] = 1
+-}
+-# this does NOT exhaustively check for all possible instructions which could
+-# overwrite a register value inherited from the caller (just the common ones)
+-/mov.*,%e?([abcd][hlx]|si|di|bp)$/ { trashed(get_reg2()) }
+-/(add|addl|sub|subl|and|or|xor|lea|sal|sar|shl|shr).*,%e?([abcd][hlx]|si|di|bp)$/ {
++function trashed(reg) {
++ if (in_function && !(reg in saved) && !(reg in dirty)) {
++ printf ".cfi_undefined %s\n", reg
++ dirty[reg] = 1
++ }
++}
++# This does NOT exhaustively check for all possible instructions which could
++# overwrite a register value inherited from the caller (just the common ones).
++/^mov.*,%e?([abcd][hlx]|si|di|bp)$/ {
++ trashed(get_reg2())
++}
++/^(add|sub|and|x?or|lea|s[ah][lr])[bwl]? [^,]+,%e?([abcd][hlx]|si|di|bp)$/ {
+ trashed(get_reg2())
+ }
+-/^i?mul [^,]*$/ { trashed("eax"); trashed("edx") }
+-/^i?mul.*,%e?([abcd][hlx]|si|di|bp)$/ { trashed(get_reg2()) }
+-/^i?div/ { trashed("eax"); trashed("edx") }
+-/(dec|inc|not|neg|pop) %e?([abcd][hlx]|si|di|bp)/ { trashed(get_reg()) }
+-/cpuid/ { trashed("eax"); trashed("ebx"); trashed("ecx"); trashed("edx") }
++/^i?mul[bwl]? [^,]+$/ { # One-operand form; the size suffix is optional.
++ trashed("eax")
++ trashed("edx")
++}
++/^i?mul[bwl]? [^,]+,%e?([abcd][hlx]|si|di|bp)$/ {
++ trashed(get_reg2())
++}
++/^i?div[bwl]? / { # Also accept suffixed forms such as "divl".
++ trashed("eax")
++ trashed("edx")
++}
++/^(dec|inc|not|neg|pop)[bwl]? %e?([abcd][hlx]|si|di|bp)$/ {
++ trashed(get_reg())
++}
++/^cpuid/ {
++ trashed("eax")
++ trashed("ebx")
++ trashed("ecx")
++ trashed("edx")
++}
+
+ END {
+ if (in_function)
+--- a/tools/add-cfi.x86_64.awk
++++ b/tools/add-cfi.x86_64.awk
+@@ -1,169 +1,246 @@
+-# Insert GAS CFI directives ("control frame information") into x86-64 asm input
++# Insert GAS CFI directives ("control frame information") into x86-64 asm input.
+
+ BEGIN {
+- # don't put CFI data in the .eh_frame ELF section (which we don't keep)
++ # Don't put CFI data in the .eh_frame ELF section (which we don't keep).
+ print ".cfi_sections .debug_frame"
+
+- # only emit CFI directives inside a function
+- in_function = 0
++ # Only emit CFI directives inside a function.
++ in_function = ""
+
+- # emit .loc directives with line numbers from original source
++ # Emit .loc directives with line numbers from original source.
+ printf ".file 1 \"%s\"\n", ARGV[1]
+ line_number = 0
+
+- # used to detect "call label; label:" trick
+- called = ""
++ re_label = "([0-9]+|[a-zA-Z_][a-zA-Z0-9_]*)"
++
++ for (i = 1; i <= 4; ++i) {
++ letter = substr("abcd", i, 1)
++ regname[letter "l"] = regname[letter "h"] = regname[letter "x"] = \
++ regname["e" letter "x"] = regname["r" letter "x"] = "r" letter "x"
++ }
++
++ regname["si"] = regname["esi"] = regname["rsi"] = "rsi"
++ regname["di"] = regname["edi"] = regname["rdi"] = "rdi"
++ regname["bp"] = regname["ebp"] = regname["rbp"] = "rbp"
++ regname["sp"] = regname["esp"] = regname["rsp"] = "rsp"
++
++ for (i = 8; i <= 15; ++i)
++ regname["r" i] = "r" i
+ }
+
++# For instructions with 2 operands, get 1st operand (assuming it is constant).
+ function get_const1() {
+- # for instructions with 2 operands, get 1st operand (assuming it is constant)
+- match($0, /-?(0x[0-9a-fA-F]+|[0-9]+),/)
+- return parse_const(substr($0, RSTART, RLENGTH-1))
++ match($2, /^\$[+-]?(0x[0-9a-fA-F]+|[0-9]+),/)
++ return parse_const(substr($2, 2, RLENGTH - 2))
+ }
+
+-function canonicalize_reg(register) {
+- if (match(register, /^r/))
+- return register
+- else if (match(register, /^e/))
+- return "r" substr(register, 2, length(register)-1)
+- else if (match(register, /[hl]$/)) # AH, AL, BH, BL, etc
+- return "r" substr(register, 1, 1) "x"
+- else # AX, BX, CX, etc
+- return "r" register
+-}
++# Only use if you already know there is 1 and only 1 register.
+ function get_reg() {
+- # only use if you already know there is 1 and only 1 register
+- match($0, /%[er]?([abcd][xlh]|si|di|bp|8|9|10|11|12|13|14|15)/)
+- return canonicalize_reg(substr($0, RSTART+1, RLENGTH-1))
++ return regname[substr($2, 2, length($2) - 1)]
+ }
++
++# For instructions with 2 operands, get 1st operand (assuming it is register).
+ function get_reg1() {
+- # for instructions with 2 operands, get 1st operand (assuming it is register)
+- match($0, /%[er]?([abcd][xlh]|si|di|bp|8|9|10|11|12|13|14|15),/)
+- return canonicalize_reg(substr($0, RSTART+1, RLENGTH-2))
++ match($2, /^%[er]?([abcd][xlh]|si|di|bp|[89]|1[0-5]),/)
++ return regname[substr($2, 2, RLENGTH - 2)]
+ }
++
++# For instructions with 2 operands, get 2nd operand (assuming it is register).
+ function get_reg2() {
+- # for instructions with 2 operands, get 2nd operand (assuming it is register)
+- match($0, /,%[er]?([abcd][xlh]|si|di|bp|8|9|10|11|12|13|14|15)/)
+- return canonicalize_reg(substr($0, RSTART+2, RLENGTH-2))
++ match($2, /,%[er]?([abcd][xlh]|si|di|bp|[89]|1[0-5])$/)
++ return regname[substr($2, RSTART + 2, RLENGTH - 2)]
+ }
+
++# Helper to adjust CFA offset.
+ function adjust_sp_offset(delta) {
+- if (in_function)
++ if (in_function) {
+ printf ".cfi_adjust_cfa_offset %d\n", delta
++ cfa_offset[in_function] += delta
++ }
++}
++
++# Helper to process jumps to labels by saving the current CFA offset.
++function jump_to_label(label) {
++ if (in_function) {
++ if (match(label, /^[0-9]+f$/)) # "forward" label
++ cfa_offset[substr(label, 1, RLENGTH - 1)] = cfa_offset[in_function]
++ else if (match(label, /^[a-zA-Z_][a-zA-Z0-9_]*$/))
++ cfa_offset[label] = cfa_offset[in_function]
++ }
+ }
+
+ {
+- line_number = line_number + 1
++ ++line_number
+
+- # clean the input up before doing anything else
+- # delete comments
+- gsub(/(#|\/\/).*/, "")
++ # Clean the input up before doing anything else.
++ # Delete comments.
++ gsub(/#.*|\/\*.*\*\//, "")
+
+- # canonicalize whitespace
+- gsub(/[ \t]+/, " ") # mawk doesn't understand \s
++ # Canonicalize whitespace.
++ gsub(/[ \t]+/, " ") # Mawk doesn't understand \s.
+ gsub(/ *, */, ",")
+ gsub(/ *: */, ": ")
+ gsub(/ $/, "")
+ gsub(/^ /, "")
+ }
+
+-# check for assembler directives which we care about
++# Check for assembler directives which we care about.
+ /^\.(section|data|text)/ {
+- # a .cfi_startproc/.cfi_endproc pair should be within the same section
+- # otherwise, clang will choke when generating ELF output
++ # A .cfi_startproc/.cfi_endproc pair should be within the same section.
++ # Otherwise, clang will choke when generating ELF output.
+ if (in_function) {
+ print ".cfi_endproc"
+- in_function = 0
++ in_function = ""
+ }
+ }
+-/^\.type [a-zA-Z0-9_]+,@function/ {
+- functions[substr($2, 1, length($2)-10)] = 1
++
++# Record each function name (the part of $2 before the first comma, if any).
++/^\.type [a-zA-Z0-9_]+( STT_FUNC|,[#@%"]function)/ {
++ functions[substr($2, 1, index($2 ",", ",") - 1)] = 1
+ }
+-# not interested in assembler directives beyond this, just pass them through
++# Not interested in assembler directives beyond this, just pass them through.
+ /^\./ {
+ print
+ next
+ }
+
+-/^[a-zA-Z0-9_]+:/ {
+- label = substr($1, 1, length($1)-1) # drop trailing :
+-
+- if (called == label) {
+- # note adjustment of stack pointer from "call label; label:"
+- adjust_sp_offset(8)
+- }
++$0 ~ "^" re_label ":" {
++ # Parse each leading label.
++ while (match($0, "^" re_label ":")) {
++
++ # Extract label name.
++ label = substr($1, 1, RLENGTH - 1)
++
++ # Remove label from current line.
++ sub("^" re_label ": ?", "")
++
++ if (label in functions) {
++ if (in_function) {
++ print ".cfi_endproc"
++ for (l in called)
++ delete called[l]
++ }
++
++ in_function = label
++ print ".cfi_startproc"
++
++ for (reg in saved)
++ delete saved[reg]
++ for (reg in dirty)
++ delete dirty[reg]
++ }
+
+- if (functions[label]) {
+- if (in_function)
+- print ".cfi_endproc"
++ printf "%s:\n", label
+
+- in_function = 1
+- print ".cfi_startproc"
++ # If this label has been jumped to, define the CFA offset to its
++ # value at the location of the jump.
++ if (!(label in functions) && in_function && label in cfa_offset) {
++ if (cfa_offset[in_function] != cfa_offset[label]) {
++ printf ".cfi_def_cfa_offset %d\n", cfa_offset[label]
++ cfa_offset[in_function] = cfa_offset[label]
++ }
++ delete cfa_offset[label]
++ }
+
+- for (register in saved)
+- delete saved[register]
+- for (register in dirty)
+- delete dirty[register]
++ # If this label has been called, adjust CFA offset.
++ if (label in called && !(label in functions)) {
++ adjust_sp_offset(8);
++ delete called[label]
++ }
+ }
+-
+- # an instruction may follow on the same line, so continue processing
++ # An instruction may follow on the same line, so continue processing.
+ }
+
++# Skip empty line.
+ /^$/ { next }
+
++# Issue source line number.
+ {
+- called = ""
+ printf ".loc 1 %d\n", line_number
+ print
+ }
+
+ # KEEPING UP WITH THE STACK POINTER
+-# %rsp should only be adjusted by pushing/popping or adding/subtracting constants
++# %rsp should only be adjusted by pushing/popping or adding/subtracting
++# constants.
+ #
+-/pushl?/ {
++/^push[wq]? / {
++ if ($1 == "pushw" || match($2, /^%([abcd]x|di|si|bp|sp)$/))
++ adjust_sp_offset(2)
++ else
++ adjust_sp_offset(8)
++}
++
++/^pop[wq]? / {
++ if ($1 == "popw" || match($2, /^%([abcd]x|di|si|bp|sp)$/))
++ adjust_sp_offset(-2)
++ else
++ adjust_sp_offset(-8)
++}
++
++/^pushfq?$/ {
+ adjust_sp_offset(8)
+ }
+-/popl?/ {
++
++/^pushfw$/ {
++ adjust_sp_offset(2)
++}
++
++/^popfq?$/ {
+ adjust_sp_offset(-8)
+ }
+-/addl? \$-?(0x[0-9a-fA-F]+|[0-9]+),%rsp/ { adjust_sp_offset(-get_const1()) }
+-/subl? \$-?(0x[0-9a-fA-F]+|[0-9]+),%rsp/ { adjust_sp_offset(get_const1()) }
+
+-/call/ {
+- if (match($0, /call [0-9]+f/)) # "forward" label
+- called = substr($0, RSTART+5, RLENGTH-6)
+- else if (match($0, /call [0-9a-zA-Z_]+/))
+- called = substr($0, RSTART+5, RLENGTH-5)
++/^popfw$/ {
++ adjust_sp_offset(-2)
++}
++
++/^addq? \$[+-]?(0x[0-9a-fA-F]+|[0-9]+),%rsp$/ {
++ adjust_sp_offset(-get_const1())
++}
++/^subq? \$[+-]?(0x[0-9a-fA-F]+|[0-9]+),%rsp$/ {
++ adjust_sp_offset(get_const1())
++}
++
++/^call / {
++ if (match($2, /^[0-9]+f$/)) # "forward" label
++ called[substr($2, 1, RLENGTH - 1)] = 1
++ else if (match($2, /^[a-zA-Z_][0-9a-zA-Z_]*$/))
++ called[$2] = 1
++}
++
++/^j/ {
++ jump_to_label($2)
+ }
+
+ # TRACKING REGISTER VALUES FROM THE PREVIOUS STACK FRAME
+ #
+-/pushl? %r(ax|bx|cx|dx|si|di|bp|8|9|10|11|12|13|14|15)/ { # don't match "push (%reg)"
+- # if a register is being pushed, and its value has not changed since the
++/^pushq? %r([abcd]x|si|di|bp|[89]|1[0-5])$/ {
++ # Don't match "push (%reg)".
++ # If a register is being pushed, and its value has not changed since the
+ # beginning of this function, the pushed value can be used when printing
+- # local variables at the next level up the stack
+- # emit '.cfi_rel_offset' for that
++ # local variables at the next level up the stack.
++ # Emit '.cfi_rel_offset' for that.
+
+ if (in_function) {
+- register = get_reg()
+- if (!saved[register] && !dirty[register]) {
+- printf ".cfi_rel_offset %s,0\n", register
+- saved[register] = 1
++ reg = get_reg()
++ if (!(reg in saved) && !(reg in dirty)) {
++ printf ".cfi_rel_offset %s,0\n", reg
++ saved[reg] = 1
+ }
+ }
+ }
+
+-/movl? %r(ax|bx|cx|dx|si|di|bp|8|9|10|11|12|13|14|15),-?(0x[0-9a-fA-F]+|[0-9]+)?\(%rsp\)/ {
++/^movq? %r([abcd]x|si|di|bp|[89]|1[0-5]),[+-]?(0x[0-9a-fA-F]+|[0-9]+)?\(%rsp\)$/ {
+ if (in_function) {
+- register = get_reg()
+- if (match($0, /-?(0x[0-9a-fA-F]+|[0-9]+)\(%rsp\)/)) {
+- offset = parse_const(substr($0, RSTART, RLENGTH-6))
++ if (match($2, /,[+-]?(0x[0-9a-fA-F]+|[0-9]+)\(%rsp\)$/)) {
++ offset = parse_const(substr($2, RSTART + 1, RLENGTH - 7)) # Skip the matched comma.
+ } else {
+ offset = 0
+ }
+- if (!saved[register] && !dirty[register]) {
+- printf ".cfi_rel_offset %s,%d\n", register, offset
+- saved[register] = 1
++ reg = get_reg1()
++ if (!(reg in saved) && !(reg in dirty)) {
++ printf ".cfi_rel_offset %s,%d\n", reg, offset
++ saved[reg] = 1
+ }
+ }
+ }
+@@ -171,24 +248,41 @@ function adjust_sp_offset(delta) {
+ # IF REGISTER VALUES ARE UNCEREMONIOUSLY TRASHED
+ # ...then we want to know about it.
+ #
+-function trashed(register) {
+- if (in_function && !saved[register] && !dirty[register]) {
+- printf ".cfi_undefined %s\n", register
+- }
+- dirty[register] = 1
+-}
+-# this does NOT exhaustively check for all possible instructions which could
+-# overwrite a register value inherited from the caller (just the common ones)
+-/mov.*,%[er]?([abcd][xlh]|si|di|bp|8|9|10|11|12|13|14|15)$/ { trashed(get_reg2()) }
+-/(add|addl|sub|subl|and|or|xor|lea|sal|sar|shl|shr).*,%[er]?([abcd][xlh]|si|di|bp|8|9|10|11|12|13|14|15)$/ {
++function trashed(reg) {
++ if (in_function && !(reg in saved) && !(reg in dirty)) {
++ printf ".cfi_undefined %s\n", reg
++ }
++ dirty[reg] = 1
++}
++# This does NOT exhaustively check for all possible instructions which could
++# overwrite a register value inherited from the caller (just the common ones).
++/^mov.*,%[er]?([abcd][xlh]|si|di|bp|[89]|1[0-5])$/ {
++ trashed(get_reg2())
++}
++/^(add|sub|and|x?or|lea|s[ah][lr])[bwlq]? [^,]+,%[er]?([abcd][xlh]|si|di|bp|[89]|1[0-5])$/ {
+ trashed(get_reg2())
+ }
+-/^i?mul [^,]*$/ { trashed("rax"); trashed("rdx") }
+-/^i?mul.*,%[er]?([abcd][xlh]|si|di|bp|8|9|10|11|12|13|14|15)$/ { trashed(get_reg2()) }
+-/^i?div/ { trashed("rax"); trashed("rdx") }
++/^i?mul[bwlq]? [^,]+$/ {
++ trashed("rax")
++ trashed("rdx")
++}
++/^i?mul[bwlq]? [^,]+,%[er]?([abcd][xlh]|si|di|bp|[89]|1[0-5])$/ {
++ trashed(get_reg2()) # Two-operand form: only the destination is overwritten.
++}
++/^i?div[bwlq]? / {
++ trashed("rax")
++ trashed("rdx")
++}
+
+-/(dec|inc|not|neg|pop) %[er]?([abcd][xlh]|si|di|bp|8|9|10|11|12|13|14|15)/ { trashed(get_reg()) }
+-/cpuid/ { trashed("rax"); trashed("rbx"); trashed("rcx"); trashed("rdx") }
++/^(dec|inc|not|neg|pop)[bwlq]? %[er]?([abcd][xlh]|si|di|bp|[89]|1[0-5])$/ {
++ trashed(get_reg())
++}
++/^cpuid$/ {
++ trashed("rax")
++ trashed("rbx")
++ trashed("rcx")
++ trashed("rdx")
++}
+
+ END {
+ if (in_function)
More information about the lede-commits
mailing list