root/tools/perf/util/genelf_debug.c
// SPDX-License-Identifier: GPL-2.0-only
/*
 * genelf_debug.c
 * Copyright (C) 2015, Google, Inc
 *
 * Contributed by:
 *      Stephane Eranian <eranian@google.com>
 *
 * based on GPLv2 source code from Oprofile
 * @remark Copyright 2007 OProfile authors
 * @author Philippe Elie
 */
#include <linux/compiler.h>
#include <linux/zalloc.h>
#include <sys/types.h>
#include <stdio.h>
#include <getopt.h>
#include <stddef.h>
#include <libelf.h>
#include <string.h>
#include <stdlib.h>
#include <inttypes.h>
#include <limits.h>
#include <fcntl.h>
#include <err.h>
#include <dwarf.h>

#include "genelf.h"
#include "../util/jitdump.h"

/* Capacity, in bytes, given to a buffer_ext the first time it has to grow. */
#define BUFFER_EXT_DFL_SIZE     (4 * 1024)

/* Short fixed-width aliases used by the packed DWARF header layouts in this file. */
typedef uint32_t uword;
typedef uint16_t uhalf;
typedef int32_t  sword;
typedef int16_t  shalf;
typedef uint8_t  ubyte;
typedef int8_t   sbyte;

/*
 * Growable, append-only byte buffer.  Each debug section is accumulated in
 * one of these before being handed to libelf.
 */
struct buffer_ext {
        size_t cur_pos;         /* number of bytes appended so far, i.e. the next write offset */
        size_t max_sz;          /* capacity currently allocated for data, in bytes */
        void *data;             /* heap storage; NULL until the buffer first grows */
};

/*
 * Debugging aid: print a banner naming @msg, then one warnx() line per byte
 * appended to @be so far, showing the byte offset and its value in hex.
 */
static void
buffer_ext_dump(struct buffer_ext *be, const char *msg)
{
        const char *bytes = be->data;
        size_t off = 0;

        warnx("DUMP for %s", msg);
        while (off < be->cur_pos) {
                /* mask to keep a possibly negative char in the 0x00-0xff range */
                warnx("%4zu 0x%02x", off, bytes[off] & 0xff);
                off++;
        }
}

/*
 * Append @sz bytes read from @addr to the end of @be, growing the storage
 * when needed.
 *
 * @be:   buffer to append to
 * @addr: source bytes; may be NULL only when @sz is 0
 * @sz:   number of bytes to append
 *
 * The capacity starts at BUFFER_EXT_DFL_SIZE and is doubled until the new
 * data fits with at least one byte to spare; the storage is then resized
 * with a single realloc().
 *
 * Returns 0 on success.  Returns -1 if the required capacity cannot be
 * represented or realloc() fails; in that case @be is left untouched.
 */
static inline int
buffer_ext_add(struct buffer_ext *be, void *addr, size_t sz)
{
        size_t new_sz = be->max_sz;
        void *tmp;

        /*
         * Nothing to copy.  Returning early also keeps a NULL @addr away
         * from memcpy(), which requires valid pointers even for size 0.
         */
        if (!sz)
                return 0;

        /*
         * cur_pos never exceeds the capacity, so the subtraction cannot
         * wrap, unlike computing cur_pos + sz.
         */
        while (sz >= new_sz - be->cur_pos) {
                if (!new_sz)
                        new_sz = BUFFER_EXT_DFL_SIZE;
                else if (new_sz > SIZE_MAX / 2)
                        return -1;      /* doubling would overflow size_t */
                else
                        new_sz <<= 1;
        }

        if (new_sz != be->max_sz) {
                tmp = realloc(be->data, new_sz);
                if (!tmp)
                        return -1;

                be->data   = tmp;
                be->max_sz = new_sz;
        }

        memcpy((char *)be->data + be->cur_pos, addr, sz);
        be->cur_pos += sz;
        return 0;
}

static void
buffer_ext_init(struct buffer_ext *be)
{
        be->data = NULL;
        be->cur_pos = 0;
        be->max_sz = 0;
}

/*
 * Release the storage of @be by handing the address of be->data to zfree().
 * cur_pos and max_sz are not modified here.
 */
static void buffer_ext_exit(struct buffer_ext *be)
{
        void **storage = &be->data;

        zfree(storage);
}

/* Return the number of bytes appended to @be so far. */
static inline size_t buffer_ext_size(struct buffer_ext *be)
{
        size_t used = be->cur_pos;

        return used;
}

/*
 * Return the start of the storage of @be.  The pointer may change whenever
 * the buffer grows, so it must be fetched again after any append.
 */
static inline void *buffer_ext_addr(struct buffer_ext *be)
{
        void *base = be->data;

        return base;
}

/*
 * Fixed-size leading part of a DWARF 2 .debug_line unit header.  The struct
 * is copied byte for byte into the section, hence __packed.
 */
struct debug_line_header {
        // length of the unit, not counting this field itself
        uword total_length;
        // version number (2 currently)
        uhalf version;
        // number of bytes from the field following this one
        // to the first program statement
        uword prolog_length;
        ubyte minimum_instruction_length;
        ubyte default_is_stmt;
        // line_base - see DWARF 2 specs
        sbyte line_base;
        // line_range - see DWARF 2 specs
        ubyte line_range;
        // number of standard opcodes + 1
        ubyte opcode_base;
        /* followed by the array of standard opcode argument counts, one ubyte each */
        /* followed by the search directories: zero-terminated strings,
         * the list itself being terminated by an empty string.
         */
        /* followed by an array of { filename, LEB128, LEB128, LEB128 }: the
         * first LEB128 is the directory index (0 means current directory),
         * then mtime and file size; the last entry is followed by an empty
         * string.
         */
        /* followed by the first program statement */
} __packed;

/* The DWARF 2 spec describes only one compilation unit header layout, while
 * binutils can handle two flavours of DWARF 2, 32-bit and 64-bit. This is not
 * related to the target architecture: a 32-bit ELF file can hold more than
 * 4 GB of debug information. For now only the 32-bit DWARF 2 compilation unit
 * header is handled, which only becomes a problem if more than 4 GB of debug
 * information is generated.
 *
 * The struct is copied byte for byte into .debug_info, hence __packed.
 */
struct compilation_unit_header {
        uword total_length;             /* length of the unit, not counting this field */
        uhalf version;                  /* DWARF version */
        uword debug_abbrev_offset;      /* offset of this unit's abbreviations in .debug_abbrev */
        ubyte pointer_size;             /* size of an address, in bytes */
} __packed;

/* Value stored in opcode_base: one more than DW_LNS_set_isa. */
#define DW_LNS_num_opcode (DW_LNS_set_isa + 1)

/*
 * Template copied at the start of each .debug_line unit by add_debug_line().
 * Fields initialised to -1 are placeholders that add_debug_line() patches
 * once the final sizes are known.
 */
static struct debug_line_header const default_debug_line_header = {
        .total_length = -1,
        .version = 2,
        .prolog_length = -1,
        .minimum_instruction_length = 1,        /* could be better when min instruction size != 1 */
        .default_is_stmt = 1,   /* we don't take care about basic block */
        .line_base = -5,        /* sensible value for line base ... */
        /*
         * NOTE(review): line_range is a ubyte, so -14 is stored as 242.
         * get_special_opcode() reads the same stored value, so encoder and
         * header agree; confirm whether 14 was the intended value.
         */
        .line_range = -14,     /* ... and line range are guessed statically */
        .opcode_base = DW_LNS_num_opcode
};

/*
 * Argument count of each standard opcode; add_debug_line() writes this array
 * right after the fixed header.  There are twelve entries, presumably indexed
 * by (opcode - 1) starting with DW_LNS_copy - verify against dwarf.h and
 * keep the count equal to opcode_base - 1.
 */
static ubyte standard_opcode_length[] =
{
        0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1
};
/* Disabled alternative spelling of the table using designated initializers. */
#if 0
{
        [DW_LNS_advance_pc]   = 1,
        [DW_LNS_advance_line] = 1,
        [DW_LNS_set_file] =  1,
        [DW_LNS_set_column] = 1,
        [DW_LNS_fixed_advance_pc] = 1,
        [DW_LNS_set_isa] = 1,
};
#endif

/*
 * Template copied at the start of each .debug_info unit by
 * add_compilation_unit().  Fields initialised to -1 are placeholders patched
 * at run time.
 */
static struct compilation_unit_header default_comp_unit_header = {
        .total_length = -1,
        .version = 2,
        .debug_abbrev_offset = 0,     /* we reuse the same abbrev entries for all comp unit */
        .pointer_size = sizeof(void *)  /* pointer size of the machine running this code */
};

/* Append the 32-bit value @data to @be as raw bytes, in host byte order. */
static void emit_uword(struct buffer_ext *be, uword data)
{
        uword value = data;

        buffer_ext_add(be, &value, sizeof(value));
}

/* Append the string @s to @be, including its terminating NUL byte. */
static void emit_string(struct buffer_ext *be, const char *s)
{
        size_t len_with_nul = strlen(s) + 1;

        buffer_ext_add(be, (void *)s, len_with_nul);
}

/*
 * Append @data to @be in unsigned LEB128 form: seven value bits per byte,
 * least significant group first, with bit 7 set on every byte except the
 * last one.  A value of 0 is emitted as a single zero byte.
 */
static void emit_unsigned_LEB128(struct buffer_ext *be,
                                 unsigned long data)
{
        ubyte group;

        /* every group except the final one carries the continuation bit */
        while (data > 0x7F) {
                group = (data & 0x7F) | 0x80;
                buffer_ext_add(be, &group, 1);
                data >>= 7;
        }

        group = data & 0x7F;
        buffer_ext_add(be, &group, 1);
}

/*
 * Append @data to @be in signed LEB128 form: seven bits per byte, least
 * significant group first, with bit 7 set on every byte except the last.
 *
 * Emission stops once the remaining value is pure sign extension (0 or -1)
 * and bit 6 of the byte just produced already carries that sign.
 */
static void emit_signed_LEB128(struct buffer_ext *be, long data)
{
        int more = 1;
        int negative = data < 0;
        int size = sizeof(long) * CHAR_BIT;

        while (more) {
                ubyte cur = data & 0x7F;

                data >>= 7;
                /*
                 * Right-shifting a negative value is implementation-defined,
                 * so force the seven vacated top bits to 1.  The mask has to
                 * be built from a long: shifting a plain int by (size - 7)
                 * bits is undefined when long is wider than int.
                 */
                if (negative)
                        data |= -(1L << (size - 7));
                if ((data == 0 && !(cur & 0x40)) ||
                    (data == -1l && (cur & 0x40)))
                        more = 0;
                else
                        cur |= 0x80;
                buffer_ext_add(be, &cur, 1);
        }
}

/*
 * Append an extended line-number opcode to @be: a zero byte, the LEB128
 * length of what follows, the opcode byte @opcode, then @data_len operand
 * bytes taken from @data.
 */
static void emit_extended_opcode(struct buffer_ext *be, ubyte opcode,
                                 void *data, size_t data_len)
{
        /* the length field counts the opcode byte plus its operand bytes */
        const size_t insn_len = data_len + 1;

        buffer_ext_add(be, (char *)"", 1);
        emit_unsigned_LEB128(be, insn_len);
        buffer_ext_add(be, &opcode, 1);
        buffer_ext_add(be, data, data_len);
}

/* Append the single byte @opcode to @be. */
static void emit_opcode(struct buffer_ext *be, ubyte opcode)
{
        ubyte op = opcode;

        buffer_ext_add(be, &op, sizeof(op));
}

/* Append @opcode to @be, followed by @data as a signed LEB128 operand. */
static void emit_opcode_signed(struct buffer_ext  *be,
                               ubyte opcode, long data)
{
        emit_opcode(be, opcode);
        emit_signed_LEB128(be, data);
}

/* Append @opcode to @be, followed by @data as an unsigned LEB128 operand. */
static void emit_opcode_unsigned(struct buffer_ext *be, ubyte opcode,
                                 unsigned long data)
{
        emit_opcode(be, opcode);
        emit_unsigned_LEB128(be, data);
}

static void emit_advance_pc(struct buffer_ext *be, unsigned long delta_pc)
{
        emit_opcode_unsigned(be, DW_LNS_advance_pc, delta_pc);
}

static void emit_advance_lineno(struct buffer_ext  *be, long delta_lineno)
{
        emit_opcode_signed(be, DW_LNS_advance_line, delta_lineno);
}

static void emit_lne_end_of_sequence(struct buffer_ext *be)
{
        emit_extended_opcode(be, DW_LNE_end_sequence, NULL, 0);
}

static void emit_set_file(struct buffer_ext *be, unsigned long idx)
{
        emit_opcode_unsigned(be, DW_LNS_set_file, idx);
}

/*
 * Append a DW_LNE_define_file extended opcode declaring @filename, with the
 * directory index, modification time and file size all set to 0 (unknown).
 */
static void emit_lne_define_filename(struct buffer_ext *be,
                                     const char *filename)
{
        /*
         * Bytes following the length field besides the name characters:
         * the opcode byte, the NUL terminator of the name and the three
         * one-byte LEB128 zeros emitted at the end.
         */
        const size_t fixed_len = 5;

        /* a zero byte introduces an extended opcode */
        buffer_ext_add(be, (void *)"", 1);
        emit_unsigned_LEB128(be, strlen(filename) + fixed_len);
        emit_opcode(be, DW_LNE_define_file);
        emit_string(be, filename);

        emit_unsigned_LEB128(be, 0);    /* directory index: unknown */
        emit_unsigned_LEB128(be, 0);    /* last modification time: unknown */
        emit_unsigned_LEB128(be, 0);    /* file size: unknown */
}

/*
 * Append a DW_LNE_set_address extended opcode whose operand is the raw bytes
 * of the pointer value @address (sizeof(unsigned long) of them).
 */
static void emit_lne_set_address(struct buffer_ext *be,
                                 void *address)
{
        void *operand = address;

        emit_extended_opcode(be, DW_LNE_set_address, &operand, sizeof(unsigned long));
}

static ubyte get_special_opcode(struct debug_entry *ent,
                                unsigned int last_line,
                                unsigned long last_vma)
{
        unsigned int temp;
        unsigned long delta_addr;

        /*
         * delta from line_base
         */
        temp = (ent->lineno - last_line) - default_debug_line_header.line_base;

        if (temp >= default_debug_line_header.line_range)
                return 0;

        /*
         * delta of addresses
         */
        delta_addr = (ent->addr - last_vma) / default_debug_line_header.minimum_instruction_length;

        /* This is not sufficient to ensure opcode will be in [0-256] but
         * sufficient to ensure when summing with the delta lineno we will
         * not overflow the unsigned long opcode */

        if (delta_addr <= 256 / default_debug_line_header.line_range) {
                unsigned long opcode = temp +
                        (delta_addr * default_debug_line_header.line_range) +
                        default_debug_line_header.opcode_base;

                return opcode <= 255 ? opcode : 0;
        }
        return 0;
}

/*
 * Append the line-number program for @nr_entry debug entries, starting at
 * @ent, to @be.
 *
 * The program first sets the address register to @code_addr.  Then, for
 * each entry, it declares and selects a new file when the entry names one,
 * and adds a row either with one special opcode or with explicit line and
 * address advances followed by DW_LNS_copy.
 */
static void emit_lineno_info(struct buffer_ext *be,
                             struct debug_entry *ent, size_t nr_entry,
                             unsigned long code_addr)
{
        /* as described in the jitdump format */
        const char repeated_name_marker[] = {'\xff', '\0'};

        /*
         * State tracked while emitting; it mirrors the state machine at the
         * start of a statement program (address 0, line 1).  No file has
         * been declared yet.
         */
        unsigned long prev_addr = 0;
        unsigned long file_idx = 0;
        const char *prev_name = NULL;
        int prev_line = 1;
        size_t n;

        emit_lne_set_address(be, (void *)code_addr);

        for (n = 0; n < nr_entry; n++, ent = debug_entry_next(ent)) {
                int name_repeated = !strcmp(repeated_name_marker, ent->name);
                int name_changed = !prev_name || strcmp(prev_name, ent->name);
                int row_pending = 0;
                ubyte special;

                /* a new, explicitly named file: declare it and switch to it */
                if (name_changed && !name_repeated) {
                        emit_lne_define_filename(be, ent->name);
                        prev_name = ent->name;
                        file_idx++;
                        emit_set_file(be, file_idx);
                        row_pending = 1;
                }

                special = get_special_opcode(ent, prev_line, prev_addr);
                if (special) {
                        /* a special opcode advances line and address and adds the row */
                        emit_opcode(be, special);
                        prev_line = ent->lineno;
                        prev_addr = ent->addr;
                        continue;
                }

                /* otherwise advance line and address separately, as needed */
                if (ent->lineno != prev_line) {
                        emit_advance_lineno(be, ent->lineno - prev_line);
                        prev_line = ent->lineno;
                        row_pending = 1;
                }
                if (ent->addr != prev_addr) {
                        emit_advance_pc(be, ent->addr - prev_addr);
                        prev_addr = ent->addr;
                        row_pending = 1;
                }

                /* add the new row to the matrix only if something changed */
                if (row_pending)
                        emit_opcode(be, DW_LNS_copy);
        }
}

/*
 * Append one complete .debug_line unit to @be: the default header, the
 * standard opcode length table, empty directory and file tables, the line
 * program for the @nr_entry entries starting at @ent (based at @code_addr)
 * and an end-of-sequence marker.  The header's prolog_length and
 * total_length are patched once the corresponding sizes are known.
 */
static void add_debug_line(struct buffer_ext *be,
        struct debug_entry *ent, size_t nr_entry,
        unsigned long code_addr)
{
        const size_t start = buffer_ext_size(be);
        struct debug_line_header *hdr;
        size_t written;

        buffer_ext_add(be, (void *)&default_debug_line_header,
                       sizeof(default_debug_line_header));
        buffer_ext_add(be, &standard_opcode_length,
                       sizeof(standard_opcode_length));

        /* empty include-directory table */
        buffer_ext_add(be, (void *)"", 1);
        /* empty file-name table */
        buffer_ext_add(be, (void *)"", 1);

        /* prolog_length counts from the field that follows it */
        written = buffer_ext_size(be) - start;
        hdr = buffer_ext_addr(be) + start;
        hdr->prolog_length = written -
                offsetof(struct debug_line_header, minimum_instruction_length);

        emit_lineno_info(be, ent, nr_entry, code_addr);
        emit_lne_end_of_sequence(be);

        /*
         * The storage may have moved while the program was appended, so
         * look the header up again before patching total_length, which
         * counts from the field that follows it.
         */
        written = buffer_ext_size(be) - start;
        hdr = buffer_ext_addr(be) + start;
        hdr->total_length = written -
                offsetof(struct debug_line_header, version);
}

/*
 * Append the abbreviation table to @be.  It holds a single abbreviation,
 * code 1: a DW_TAG_compile_unit whose only attribute is DW_AT_stmt_list
 * encoded as DW_FORM_data4.  Every value is written as unsigned LEB128.
 */
static void
add_debug_abbrev(struct buffer_ext *be)
{
        static const unsigned long abbrev_table[] = {
                1,                      /* abbreviation code */
                DW_TAG_compile_unit,
                DW_CHILDREN_yes,
                DW_AT_stmt_list,        /* the one attribute ... */
                DW_FORM_data4,          /* ... and its form */
                0,                      /* three closing zeros: */
                0,                      /* end of the attribute list */
                0,                      /* and of the table */
        };
        size_t i;

        for (i = 0; i < sizeof(abbrev_table) / sizeof(abbrev_table[0]); i++)
                emit_unsigned_LEB128(be, abbrev_table[i]);
}

static void
add_compilation_unit(struct buffer_ext *be,
                     size_t offset_debug_line)
{
        struct compilation_unit_header *comp_unit_header;
        size_t old_size = buffer_ext_size(be);

        buffer_ext_add(be, &default_comp_unit_header,
                       sizeof(default_comp_unit_header));

        emit_unsigned_LEB128(be, 1);
        emit_uword(be, offset_debug_line);

        comp_unit_header = buffer_ext_addr(be) + old_size;
        comp_unit_header->total_length = (buffer_ext_size(be) - old_size) -
                offsetof(struct compilation_unit_header, version);
}

/*
 * Build the contents of the three debug sections for one jitted function.
 *
 * @code_addr:        subtracted from the address of every entry
 * @debug:            first of @nr_debug_entries debug entries; their
 *                    addresses are rewritten in place
 * @dl, @da, @di:     buffers receiving .debug_line, .debug_abbrev and
 *                    .debug_info respectively
 *
 * Always returns 0.
 */
static int
jit_process_debug_info(uint64_t code_addr,
                       void *debug, int nr_debug_entries,
                       struct buffer_ext *dl,
                       struct buffer_ext *da,
                       struct buffer_ext *di)
{
        struct debug_entry *cursor;
        int remaining;

        /* make every address relative to the start of the code */
        for (cursor = debug, remaining = nr_debug_entries; remaining > 0;
             remaining--, cursor = debug_entry_next(cursor))
                cursor->addr -= code_addr;

        /* the unit points at the position where its line table will start */
        add_compilation_unit(di, buffer_ext_size(dl));
        add_debug_line(dl, debug, nr_debug_entries, GEN_ELF_TEXT_OFFSET);
        add_debug_abbrev(da);
        if (0) buffer_ext_dump(da, "abbrev");

        return 0;
}

/*
 * Append one SHT_PROGBITS section to @e whose contents are the bytes
 * accumulated in @be.
 *
 * @sh_name is stored as-is in the section header; it is the offset of the
 * section's name in a string table that is not built in this file, so the
 * values passed by the caller must match that table.
 *
 * Returns 0 on success, -1 after printing a warning when libelf fails.
 */
static int
jit_add_debug_section(Elf *e, struct buffer_ext *be, unsigned int sh_name)
{
        Elf_Data *d;
        Elf_Scn *scn;
        Elf_Shdr *shdr;

        scn = elf_newscn(e);
        if (!scn) {
                warnx("cannot create section");
                return -1;
        }

        d = elf_newdata(scn);
        if (!d) {
                warnx("cannot get new data");
                return -1;
        }

        /* libelf only keeps the pointer, so @be must stay alive until elf_update() */
        d->d_align = 1;
        d->d_off = 0LL;
        d->d_buf = buffer_ext_addr(be);
        d->d_type = ELF_T_BYTE;
        d->d_size = buffer_ext_size(be);
        d->d_version = EV_CURRENT;

        shdr = elf_getshdr(scn);
        if (!shdr) {
                warnx("cannot get section header");
                return -1;
        }

        shdr->sh_name = sh_name;
        shdr->sh_type = SHT_PROGBITS;
        shdr->sh_addr = 0; /* must be zero or == sh_offset -> dynamic object */
        shdr->sh_flags = 0;
        shdr->sh_entsize = 0;

        return 0;
}

/*
 * Generate the .debug_line, .debug_info and .debug_abbrev sections for one
 * jitted function and write the updated ELF image.
 *
 * @e:                ELF descriptor the sections are added to
 * @code_addr:        load address of the function; entry addresses are made
 *                    relative to it
 * @debug:            first of @nr_debug_entries debug entries (modified in
 *                    place)
 *
 * Returns 0 on success and -1 on failure.  The temporary buffers are
 * released on every path.
 */
int
jit_add_debug_info(Elf *e, uint64_t code_addr, void *debug, int nr_debug_entries)
{
        struct buffer_ext dl, di, da;
        int ret = -1;

        buffer_ext_init(&dl);
        buffer_ext_init(&di);
        buffer_ext_init(&da);

        if (jit_process_debug_info(code_addr, debug, nr_debug_entries, &dl, &da, &di))
                goto out;

        /* sections are created in this order: line, info, abbrev */
        if (jit_add_debug_section(e, &dl, 52) ||        /* .debug_line */
            jit_add_debug_section(e, &di, 64) ||        /* .debug_info */
            jit_add_debug_section(e, &da, 76))          /* .debug_abbrev */
                goto out;

        /*
         * now we update the ELF image with all the sections
         */
        if (elf_update(e, ELF_C_WRITE) < 0)
                warnx("elf_update debug failed");
        else
                ret = 0;

out:
        buffer_ext_exit(&dl);
        buffer_ext_exit(&di);
        buffer_ext_exit(&da);
        return ret;
}