/* SPDX-License-Identifier: GPL-2.0 */ /* * Generate opcode table initializers for the in-kernel disassembler. * * Copyright IBM Corp. 2017 * */ #include <stdlib.h> #include <string.h> #include <ctype.h> #include <stdio.h> #define STRING_SIZE_MAX 20 struct insn_type { unsigned char byte; unsigned char mask; char **format; }; struct insn { struct insn_type *type; char opcode[STRING_SIZE_MAX]; char name[STRING_SIZE_MAX]; char upper[STRING_SIZE_MAX]; char format[STRING_SIZE_MAX]; unsigned int name_len; }; struct insn_group { struct insn_type *type; int offset; int count; char opcode[2]; }; struct insn_format { char *format; int type; }; struct gen_opcode { struct insn *insn; int nr; struct insn_group *group; int nr_groups; }; /* * Table of instruction format types. Each opcode is defined with at * least one byte (two nibbles), three nibbles, or two bytes (four * nibbles). * The byte member of each instruction format type entry defines * within which byte of an instruction the third (and fourth) nibble * of an opcode can be found. The mask member is the and-mask that * needs to be applied on this byte in order to get the third (and * fourth) nibble of the opcode. * The format array defines all instruction formats (as defined in the * Principles of Operation) which have the same position of the opcode * nibbles. * A special case are instruction formats with 1-byte opcodes. In this * case the byte member always is zero, so that the mask is applied on * the (only) byte that contains the opcode. */ static struct insn_type insn_type_table[] = { { .byte = 0, .mask = 0xff, .format = (char *[]) { "MII", "RR", "RS", "RSI", "RX", "SI", "SMI", "SS", NULL, }, }, { .byte = 1, .mask = 0x0f, .format = (char *[]) { "RI", "RIL", "SSF", NULL, }, }, { .byte = 1, .mask = 0xff, .format = (char *[]) { "E", "IE", "RRE", "RRF", "RRR", "S", "SIL", "SSE", NULL, }, }, { .byte = 5, .mask = 0xff, .format = (char *[]) { "RIE", "RIS", "RRS", "RSE", "RSL", "RSY", "RXE", "RXF", "RXY", "SIY", "VRI", "VRR", "VRS", "VRV", "VRX", "VSI", NULL, }, }, }; static struct insn_type *insn_format_to_type(char *format) { char tmp[STRING_SIZE_MAX]; char *base_format, **ptr; int i; strcpy(tmp, format); base_format = tmp; base_format = strsep(&base_format, "_"); for (i = 0; i < sizeof(insn_type_table) / sizeof(insn_type_table[0]); i++) { ptr = insn_type_table[i].format; while (*ptr) { if (!strcmp(base_format, *ptr)) return &insn_type_table[i]; ptr++; } } exit(EXIT_FAILURE); } static void read_instructions(struct gen_opcode *desc) { struct insn insn; int rc, i; while (1) { rc = scanf("%s %s %s", insn.opcode, insn.name, insn.format); if (rc == EOF) break; if (rc != 3) exit(EXIT_FAILURE); insn.type = insn_format_to_type(insn.format); insn.name_len = strlen(insn.name); for (i = 0; i <= insn.name_len; i++) insn.upper[i] = toupper((unsigned char)insn.name[i]); desc->nr++; desc->insn = realloc(desc->insn, desc->nr * sizeof(*desc->insn)); if (!desc->insn) exit(EXIT_FAILURE); desc->insn[desc->nr - 1] = insn; } } static int cmpformat(const void *a, const void *b) { return strcmp(((struct insn *)a)->format, ((struct insn *)b)->format); } static void print_formats(struct gen_opcode *desc) { char *format; int i, count; qsort(desc->insn, desc->nr, sizeof(*desc->insn), cmpformat); format = ""; count = 0; printf("enum {\n"); for (i = 0; i < desc->nr; i++) { if (!strcmp(format, desc->insn[i].format)) continue; count++; format = desc->insn[i].format; printf("\tINSTR_%s,\n", format); } printf("}; /* %d */\n\n", count); } static int cmp_long_insn(const void *a, const void *b) { return strcmp(((struct insn *)a)->name, ((struct insn *)b)->name); } static void print_long_insn(struct gen_opcode *desc) { struct insn *insn; int i, count; qsort(desc->insn, desc->nr, sizeof(*desc->insn), cmp_long_insn); count = 0; printf("enum {\n"); for (i = 0; i < desc->nr; i++) { insn = &desc->insn[i]; if (insn->name_len < 6) continue; printf("\tLONG_INSN_%s,\n", insn->upper); count++; } printf("}; /* %d */\n\n", count); printf("#define LONG_INSN_INITIALIZER { \\\n"); for (i = 0; i < desc->nr; i++) { insn = &desc->insn[i]; if (insn->name_len < 6) continue; printf("\t[LONG_INSN_%s] = \"%s\", \\\n", insn->upper, insn->name); } printf("}\n\n"); } static void print_opcode(struct insn *insn, int nr) { char *opcode; opcode = insn->opcode; if (insn->type->byte != 0) opcode += 2; printf("\t[%4d] = { .opfrag = 0x%s, .format = INSTR_%s, ", nr, opcode, insn->format); if (insn->name_len < 6) printf(".name = \"%s\" ", insn->name); else printf(".offset = LONG_INSN_%s ", insn->upper); printf("}, \\\n"); } static void add_to_group(struct gen_opcode *desc, struct insn *insn, int offset) { struct insn_group *group; group = desc->group ? &desc->group[desc->nr_groups - 1] : NULL; if (group && (!strncmp(group->opcode, insn->opcode, 2) || group->type->byte == 0)) { group->count++; return; } desc->nr_groups++; desc->group = realloc(desc->group, desc->nr_groups * sizeof(*desc->group)); if (!desc->group) exit(EXIT_FAILURE); group = &desc->group[desc->nr_groups - 1]; memcpy(group->opcode, insn->opcode, 2); group->type = insn->type; group->offset = offset; group->count = 1; } static int cmpopcode(const void *a, const void *b) { return strcmp(((struct insn *)a)->opcode, ((struct insn *)b)->opcode); } static void print_opcode_table(struct gen_opcode *desc) { char opcode[2] = ""; struct insn *insn; int i, offset; qsort(desc->insn, desc->nr, sizeof(*desc->insn), cmpopcode); printf("#define OPCODE_TABLE_INITIALIZER { \\\n"); offset = 0; for (i = 0; i < desc->nr; i++) { insn = &desc->insn[i]; if (insn->type->byte == 0) continue; add_to_group(desc, insn, offset); if (strncmp(opcode, insn->opcode, 2)) { memcpy(opcode, insn->opcode, 2); printf("\t/* %.2s */ \\\n", opcode); } print_opcode(insn, offset); offset++; } printf("\t/* 1-byte opcode instructions */ \\\n"); for (i = 0; i < desc->nr; i++) { insn = &desc->insn[i]; if (insn->type->byte != 0) continue; add_to_group(desc, insn, offset); print_opcode(insn, offset); offset++; } printf("}\n\n"); } static void print_opcode_table_offsets(struct gen_opcode *desc) { struct insn_group *group; int i; printf("#define OPCODE_OFFSET_INITIALIZER { \\\n"); for (i = 0; i < desc->nr_groups; i++) { group = &desc->group[i]; printf("\t{ .opcode = 0x%.2s, .mask = 0x%02x, .byte = %d, .offset = %d, .count = %d }, \\\n", group->opcode, group->type->mask, group->type->byte, group->offset, group->count); } printf("}\n\n"); } int main(int argc, char **argv) { struct gen_opcode _desc = { 0 }; struct gen_opcode *desc = &_desc; read_instructions(desc); printf("#ifndef __S390_GENERATED_DIS_DEFS_H__\n"); printf("#define __S390_GENERATED_DIS_DEFS_H__\n"); printf("/*\n"); printf(" * DO NOT MODIFY.\n"); printf(" *\n"); printf(" * This file was generated by %s\n", __FILE__); printf(" */\n\n"); print_formats(desc); print_long_insn(desc); print_opcode_table(desc); print_opcode_table_offsets(desc); printf("#endif\n"); exit(EXIT_SUCCESS); }