hibot/source/syntax.h

335 lines
16 KiB
C

#include <string.h>
/* Maximum number of highlighting rules that can be registered; syntax_rule
 * silently ignores registrations once this many rules are stored. */
#define SYNTAX_LIMIT (256)
/* Two-digit colour codes. syntax_highlight emits them right after a "\003"
 * control byte and closes each token with "\017".
 * NOTE(review): the values look like mIRC-style colour numbers - confirm
 * against the consumer of the highlighted text. */
#define COLOUR_WHITE ("00")
#define COLOUR_BLUE ("02")
#define COLOUR_GREEN ("03")
#define COLOUR_RED ("04")
#define COLOUR_BROWN ("05")
#define COLOUR_MAGENTA ("06")
#define COLOUR_ORANGE ("07")
#define COLOUR_YELLOW ("08")
#define COLOUR_CYAN ("11")
#define COLOUR_PINK ("13")
#define COLOUR_GREY ("14")
/* Language setup routines: each one appends its rules to the shared rule
 * table below by calling syntax_rule. */
extern void syntax_c (void);
extern void syntax_ada (void);
extern void syntax_cpp (void);
extern void syntax_fasm (void);
/* Returns a pointer to a static buffer holding the highlighted copy of
 * 'string'; the buffer is overwritten by the next call. */
extern char * syntax_highlight (char * string);
/* Number of rules currently stored in the parallel arrays below. */
static size_t syntax_count = 0;
/* Per rule: 0 = 'begin' is a literal prefix to match, non-zero = 'begin' is
 * a set of characters, any one of which may start the token. */
static int syntax_enrange [SYNTAX_LIMIT];
/* Per rule: 0 = 'end' is a literal string that closes the token (and is part
 * of it), non-zero = 'end' is a set of characters that stop the token (and
 * are not part of it). */
static int syntax_derange [SYNTAX_LIMIT];
/* Per rule: begin pattern / begin character set (NUL-terminated string). */
static char syntax_begin [SYNTAX_LIMIT] [96];
/* Per rule: end pattern / end character set (NUL-terminated string). */
static char syntax_end [SYNTAX_LIMIT] [96];
/* Per rule: escape character; while scanning a token, the character that
 * follows it is skipped. */
static char syntax_escape [SYNTAX_LIMIT];
/* Per rule: colour code string (one of the COLOUR_* macros above); only the
 * pointer is stored, the text is not copied. */
static char * syntax_colour [SYNTAX_LIMIT];
/*
 * Test whether 'character' occurs in the NUL-terminated set 'character_array'.
 *
 * Returns 1 when the character is one of the set members, 0 otherwise.
 * The terminating '\0' is never treated as a member, so an empty (or NULL)
 * set matches nothing. The previous do/while form walked past the end of an
 * empty set because its index could never equal a length of zero.
 */
static int character_compare_array (char character, char * character_array) {
	size_t i;

	if (character_array == NULL) {
		return (0);
	}

	/* Stop at the terminator instead of re-measuring the set on every step. */
	for (i = 0; character_array [i] != '\0'; ++i) {
		if (character == character_array [i]) {
			return (1);
		}
	}

	return (0);
}
/*
 * Append one highlighting rule to the rule table.
 *
 * enrange - 0: 'begin' is a literal prefix; non-zero: 'begin' is a set of
 *           characters, any of which starts the token.
 * derange - 0: 'end' is a literal closing string; non-zero: 'end' is a set of
 *           characters that stop the token.
 * begin   - begin pattern / character set (copied into the table).
 * end     - end pattern / character set (copied into the table).
 * escape  - character whose successor is skipped while scanning the token.
 * colour  - colour code string; only the pointer is stored, so it must
 *           outlive the rule table (the COLOUR_* literals do).
 *
 * The rule is silently dropped when the table already holds SYNTAX_LIMIT
 * rules. Patterns longer than a table row are truncated to fit; the row is
 * always NUL-terminated, which a bare strncpy of the full row size did not
 * guarantee.
 */
static void syntax_rule (int    enrange,
                         int    derange,
                         char * begin,
                         char * end,
                         char   escape,
                         char * colour) {
	if (syntax_count >= SYNTAX_LIMIT) {
		return;
	}

	/* Copy at most row-size - 1 bytes and terminate explicitly. */
	strncpy (syntax_begin [syntax_count], begin, sizeof (syntax_begin [0]) - 1);
	syntax_begin [syntax_count] [sizeof (syntax_begin [0]) - 1] = '\0';

	strncpy (syntax_end [syntax_count], end, sizeof (syntax_end [0]) - 1);
	syntax_end [syntax_count] [sizeof (syntax_end [0]) - 1] = '\0';

	syntax_enrange [syntax_count] = enrange;
	syntax_derange [syntax_count] = derange;
	syntax_escape  [syntax_count] = escape;
	syntax_colour  [syntax_count] = colour;

	++syntax_count;
}
/*
 * Classify the token that starts at 'string' and measure it.
 *
 * Rules are tried in registration order and the first match wins:
 *   - enrange == 0, derange == 0: 'string' starts with the begin pattern.
 *   - enrange == 0, derange != 0: 'string' starts with the begin pattern and
 *     the next character is a member of the rule's end set.
 *   - enrange != 0: the first character is a member of the begin set.
 *
 * string - NUL-terminated text to examine (expected to be non-empty).
 * length - receives the token length in bytes. It is always written:
 *            * 1 when no rule matches;
 *            * up to and including the end pattern when derange == 0;
 *            * up to but excluding the stop character when derange != 0;
 *            * the whole remaining text when the token is not closed before
 *              the end of the input (this is 0 only for an empty 'string').
 *
 * Returns the index of the matching rule, or syntax_count when none matches.
 *
 * NOTE(review): a keyword directly followed by the end of the input is not
 * matched by its keyword rule, because '\0' is not in the separator set; it
 * falls through to a later rule. Confirm whether that is intended.
 */
static size_t syntax_loop (char   * string,
                           size_t * length) {
	size_t offset, subset, select, begin_length, end_length, remaining;

	/* Stage 1: pick the first rule that matches at the start of the text. */
	for (select = 0; select != syntax_count; ++select) {
		begin_length = strlen (syntax_begin [select]);

		if (syntax_enrange [select] == 0) {
			if (strncmp (string, syntax_begin [select], begin_length) != 0) {
				continue;
			}
			if (syntax_derange [select] == 0) {
				break;
			}
			/* The prefix matched, so index begin_length is at most the terminator. */
			if (character_compare_array (string [begin_length], syntax_end [select]) == 1) {
				break;
			}
		} else {
			for (subset = 0; subset != begin_length; ++subset) {
				if (string [0] == syntax_begin [select] [subset]) {
					goto selected;
				}
			}
		}
	}

selected:
	if (select >= syntax_count) {
		* length = 1;
		return (select);
	}

	/* Stage 2: find where the token ends. */
	remaining  = strlen (string);
	end_length = strlen (syntax_end [select]);

	/* Default for a token that is never closed: it runs to the end of input. */
	* length = remaining;

	/* offset == remaining is visited on purpose so that an empty end pattern
	 * can close a token that sits at the very end of the text. */
	for (offset = 1; offset <= remaining; ++offset) {
		/* An escape of '\0' means "no escape"; without this guard the string
		 * terminator itself was treated as an escape and skipped over. */
		if ((syntax_escape [select] != '\0') && (string [offset] == syntax_escape [select])) {
			++offset;
			continue;
		}

		if (syntax_derange [select] == 0) {
			if (strncmp (& string [offset], syntax_end [select], end_length) == 0) {
				* length = offset + end_length;
				return (select);
			}
		} else {
			if (end_length == 0) {
				/* Nothing can stop this token; keep the default length. */
				break;
			}
			for (subset = 0; subset != end_length; ++subset) {
				if (string [offset] == syntax_end [select] [subset]) {
					* length = offset;
					return (select);
				}
			}
		}
	}

	return (select);
}
/*
 * Register the highlighting rules for C.
 *
 * Registration order is significant because the first matching rule wins:
 * comments, preprocessor lines and literals come first, then the keywords,
 * then brackets, operators, numbers and plain identifiers.
 */
void syntax_c (void) {
	/* Characters that terminate a keyword, number or identifier. */
	char * delimiters = ".,:;<=>+-*/%!&~^?|()[]{}'\" \t\r\n";

	char * reserved [] = {
		"register", "volatile", "auto",     "const",    "static",   "extern",   "if",       "else",
		"do",       "while",    "for",      "continue", "switch",   "case",     "default",  "break",
		"enum",     "union",    "struct",   "typedef",  "goto",     "void",     "return",   "sizeof",
		"char",     "short",    "int",      "long",     "signed",   "unsigned", "float",    "double"
	};

	size_t reserved_total = sizeof (reserved) / sizeof (reserved [0]);
	size_t index          = 0;

	/* Comments, preprocessor directives, character and string literals. */
	syntax_rule (0, 0, "/*", "*/", '\0', COLOUR_GREY);
	syntax_rule (0, 0, "//", "\n", '\0', COLOUR_GREY);
	syntax_rule (0, 0, "#",  "\n", '\\', COLOUR_YELLOW);
	syntax_rule (0, 0, "'",  "'",  '\\', COLOUR_PINK);
	syntax_rule (0, 0, "\"", "\"", '\\', COLOUR_PINK);

	/* Keywords: literal word that must be followed by a delimiter. */
	while (index < reserved_total) {
		syntax_rule (0, 1, reserved [index], delimiters, '\0', COLOUR_YELLOW);
		++index;
	}

	/* Single-character brackets and operators. */
	syntax_rule (1, 0, "()[]{}",             "", '\0', COLOUR_BLUE);
	syntax_rule (1, 0, ".,:;<=>+*-/%!&~^?|", "", '\0', COLOUR_CYAN);

	/* Numbers and identifiers, each running up to the next delimiter. */
	syntax_rule (1, 1, "0123456789",                 delimiters, '\0', COLOUR_PINK);
	syntax_rule (1, 1, "abcdefghijklmnopqrstuvwxyz", delimiters, '\0', COLOUR_WHITE);
	syntax_rule (1, 1, "ABCDEFGHIJKLMNOPQRSTUVWXYZ", delimiters, '\0', COLOUR_WHITE);
	syntax_rule (1, 1, "_",                          delimiters, '\0', COLOUR_WHITE);
}
/*
 * Register the highlighting rules for Ada.
 *
 * Registration order is significant because the first matching rule wins:
 * comments and literals come first, then the reserved words, then
 * parentheses, operators, numbers and plain identifiers.
 *
 * Ada has no backslash escape inside character or string literals (a quote
 * inside a string is written by doubling it), so the literal rules are
 * registered with no escape character. With a backslash escape, a literal
 * such as "C:\" or '\' swallowed its own closing quote.
 */
void syntax_ada (void) {
	/* Characters that terminate a reserved word, number or identifier. */
	char * separators = ".,:;<=>+-*/&|()\" \t\r\n";

	char * keywords [] = {
		"abort",        "else",         "new",          "return",       "abs",          "elsif",        "not",          "reverse",
		"abstract",     "end",          "null",         "accept",       "entry",        "select",       "access",       "of",
		"separate",     "aliased",      "exit",         "or",           "some",         "all",          "others",       "subtype",
		"and",          "for",          "out",          "array",        "function",     "at",           "tagged",       "generic",
		"package",      "task",         "begin",        "goto",         "pragma",       "body",         "private",      "then",
		"type",         "case",         "in",           "constant",     "until",        "is",           "raise",        "use",
		"if",           "declare",      "range",        "delay",        "limited",      "record",       "when",         "delta",
		"loop",         "rem",          "while",        "digits",       "renames",      "with",         "do",           "mod",
		"requeue",      "xor",          "procedure",    "protected",    "interface",    "synchronized", "exception",    "overriding",
		"terminate"
	};

	size_t word;

	/* Comments, then character and string literals (no escape character). */
	syntax_rule (0, 0, "--", "\n", '\0', COLOUR_GREY);
	syntax_rule (0, 0, "'",  "'",  '\0', COLOUR_PINK);
	syntax_rule (0, 0, "\"", "\"", '\0', COLOUR_PINK);

	/* Reserved words: literal word that must be followed by a separator. */
	for (word = 0; word != sizeof (keywords) / sizeof (keywords [0]); ++word) {
		syntax_rule (0, 1, keywords [word], separators, '\0', COLOUR_YELLOW);
	}

	/* Single-character parentheses and operators. */
	syntax_rule (1, 0, "()",              "", '\0', COLOUR_BLUE);
	syntax_rule (1, 0, ".,:;<=>+-*/&|'",  "", '\0', COLOUR_CYAN);

	/* Numbers and identifiers, each running up to the next separator. */
	syntax_rule (1, 1, "0123456789",                 separators, '\0', COLOUR_PINK);
	syntax_rule (1, 1, "abcdefghijklmnopqrstuvwxyz", separators, '\0', COLOUR_WHITE);
	syntax_rule (1, 1, "ABCDEFGHIJKLMNOPQRSTUVWXYZ", separators, '\0', COLOUR_WHITE);
}
/*
 * Register the highlighting rules for C++.
 *
 * Registration order is significant because the first matching rule wins:
 * comments, preprocessor lines and literals come first, then the keywords,
 * then a short list of well-known library names, then brackets, operators,
 * numbers and plain identifiers.
 */
void syntax_cpp (void) {
	/* Characters that terminate a keyword, number or identifier. */
	char * delimiters = ".,:;<=>+-*/%!&~^?|()[]{}'\" \t\r\n";

	char * reserved [] = {
		"alignas",          "alignof",          "and",              "and_eq",           "asm",              "atomic_cancel",    "atomic_commit",    "atomic_noexcept",
		"auto",             "bitand",           "bitor",            "bool",             "break",            "case",             "catch",            "char",
		"char8_t",          "char16_t",         "char32_t",         "class",            "compl",            "concept",          "const",            "consteval",
		"constexpr",        "constinit",        "const_cast",       "continue",         "co_await",         "co_return",        "co_yield",         "decltype",
		"default",          "delete",           "do",               "double",           "dynamic_cast",     "else",             "enum",             "explicit",
		"export",           "extern",           "false",            "float",            "for",              "friend",           "goto",             "if",
		"inline",           "int",              "long",             "mutable",          "namespace",        "new",              "noexcept",         "not",
		"not_eq",           "nullptr",          "operator",         "or",               "or_eq",            "private",          "protected",        "public",
		"reflexpr",         "register",         "reinterpret_cast", "requires",         "return",           "short",            "signed",           "sizeof",
		"static",           "static_assert",    "static_cast",      "struct",           "switch",           "synchronized",     "template",         "this",
		"thread_local",     "throw",            "true",             "try",              "typedef",          "typeid",           "typename",         "union",
		"unsigned",         "using",            "virtual",          "void",             "volatile",         "wchar_t",          "while",            "xor",
		"xor_eq",           "final",            "override",         "import",           "module",           "transaction_safe"
	};

	/* Commonly seen type and library names, coloured differently from keywords. */
	char * library_names [] = {
		"int8_t",   "int16_t",  "int32_t",  "int64_t",  "uint8_t",  "uint16_t", "uint32_t", "uint64_t",
		"FILE",     "std",      "typeof",   "cout",     "cin",      "endl",     "timespec", "tm"
		/* TODO: extend this list with further names worth highlighting. */
	};

	size_t reserved_total = sizeof (reserved) / sizeof (reserved [0]);
	size_t library_total  = sizeof (library_names) / sizeof (library_names [0]);
	size_t index;

	/* Comments, preprocessor directives, character and string literals. */
	syntax_rule (0, 0, "/*", "*/", '\0', COLOUR_GREY);
	syntax_rule (0, 0, "//", "\n", '\0', COLOUR_GREY);
	syntax_rule (0, 0, "#",  "\n", '\\', COLOUR_YELLOW);
	syntax_rule (0, 0, "'",  "'",  '\\', COLOUR_PINK);
	syntax_rule (0, 0, "\"", "\"", '\\', COLOUR_PINK);

	/* Keywords: literal word that must be followed by a delimiter. */
	index = 0;
	while (index < reserved_total) {
		syntax_rule (0, 1, reserved [index], delimiters, '\0', COLOUR_YELLOW);
		++index;
	}

	/* Library names: matched the same way, shown in another colour. */
	index = 0;
	while (index < library_total) {
		syntax_rule (0, 1, library_names [index], delimiters, '\0', COLOUR_CYAN);
		++index;
	}

	/* Single-character brackets and operators. */
	syntax_rule (1, 0, "()[]{}",             "", '\0', COLOUR_BLUE);
	syntax_rule (1, 0, ".,:;<=>+*-/%!&~^?|", "", '\0', COLOUR_CYAN);

	/* Numbers and identifiers, each running up to the next delimiter. */
	syntax_rule (1, 1, "0123456789",                 delimiters, '\0', COLOUR_PINK);
	syntax_rule (1, 1, "abcdefghijklmnopqrstuvwxyz", delimiters, '\0', COLOUR_WHITE);
	syntax_rule (1, 1, "ABCDEFGHIJKLMNOPQRSTUVWXYZ", delimiters, '\0', COLOUR_WHITE);
	syntax_rule (1, 1, "_",                          delimiters, '\0', COLOUR_WHITE);
}
/*
 * Register the highlighting rules for flat assembler (x86-64) source.
 *
 * Registration order is significant because the first matching rule wins:
 * comments and quoted strings come first, then instruction mnemonics,
 * register names and directives, then brackets, operators, numbers and
 * plain identifiers.
 *
 * Changes from the previous table:
 *   - "movsd" was listed twice; the duplicate could never match and only
 *     consumed one of the SYNTAX_LIMIT rule slots, so it is listed once.
 *   - Quoted strings are registered with no escape character, since flat
 *     assembler writes a quote inside a string by doubling it and gives the
 *     backslash no special meaning there. With a backslash escape, a string
 *     such as 'C:\' swallowed its own closing quote.
 */
void syntax_fasm (void) {
	/* Characters that terminate a mnemonic, register, number or identifier. */
	char * separators = ".,+-=:;(){}[]%$<> \t\r\n";

	char * instructions [] = {
		"mov",      "movabs",   "movapd",   "movaps",   "movebe",   "movsd",    "movsx",    "movzx",
		"movsxd",   "movd",     "movq",     "movs",     "movsb",    "movsw",    "movsq",
		"cmovmp",   "cmovrcxz", "cmovc",    "cmovnc",   "cmove",    "cmovne",   "cmovz",    "cmovnz",
		"cmovg",    "cmovng",   "cmovge",   "cmovnge",  "cmovl",    "cmovnl",   "cmovle",   "cmovnle",
		"cmova",    "cmovna",   "cmovae",   "cmovnae",  "cmovb",    "cmovnb",   "cmovbe",   "cmovnbe",
		"cmovs",    "cmovns",   "cmovo",    "cmovno",   "cmovp",    "cmovnp",   "cmovpo",   "cmovpe",
		"cmp",      "cmps",     "cmpsb",    "cmpsw",    "cmpsd",    "cmpsq",    "cmpxchg",  "lea",
		"monitor",  "cpuid",    "in",       "out",      "syscall",  "sysenter", "sysret",   "sysexit",
		"swap",     "bswap",    "pop",      "push",     "call",     "ret",      "enter",    "leave",
		"and",      "or",       "not",      "neg",      "sal",      "sar",      "shl",      "shr",
		"inc",      "dec",      "add",      "sub",      "mul",      "div",      "imul",     "idiv",
		"nop",      "fnop",     "adc",      "sbb",      "aaa",      "aas",      "aam",      "aad",
		"jmp",      "jrcxz",    "jc",       "jnc",      "je",       "jne",      "jz",       "jnz",
		"jg",       "jng",      "jge",      "jnge",     "jl",       "jnl",      "jle",      "jnle",
		"ja",       "jna",      "jae",      "jnae",     "jb",       "jnb",      "jbe",      "jnbe",
		"js",       "jns",      "jo",       "jno",      "jp",       "jnp",      "jpo",      "jpe",
		"rep",      "repe",     "repz",     "repne",    "repnz",    "loop",     "loope",    "loopne"
	};

	char * registers [] = {
		"rax",      "rcx",      "rdx",      "rbx",      "rsp",      "rbp",      "rsi",      "rdi",
		"r8",       "r9",       "r10",      "r11",      "r12",      "r13",      "r14",      "r15",
		"eax",      "ecx",      "edx",      "ebx",      "esp",      "ebp",      "esi",      "edi",
		"r8d",      "r9d",      "r10d",     "r11d",     "r12d",     "r13d",     "r14d",     "r15d",
		"ax",       "cx",       "dx",       "bx",       "sp",       "bp",       "si",       "di",
		"r8w",      "r9w",      "r10w",     "r11w",     "r12w",     "r13w",     "r14w",     "r15w",
		"al",       "cl",       "dl",       "bl",       "spl",      "bpl",      "sil",      "dil",
		"r8b",      "r9b",      "r10b",     "r11b",     "r12b",     "r13b",     "r14b",     "r15b",
		"ah",       "ch",       "dh",       "bh"
	};

	char * keywords [] = {
		"format",   "executable", "readable", "writable", "segment",  "sector",   "entry",    "macro",
		"db",       "dw",         "dd",       "dq",       "rb",       "rw",       "rd",       "rq"
	};

	size_t word;

	/* Comments, then quoted strings (no escape character). */
	syntax_rule (0, 0, ";",  "\n", '\0', COLOUR_GREY);
	syntax_rule (0, 0, "'",  "'",  '\0', COLOUR_PINK);
	syntax_rule (0, 0, "\"", "\"", '\0', COLOUR_PINK);

	/* Mnemonics, registers and directives: literal word followed by a separator. */
	for (word = 0; word != sizeof (instructions) / sizeof (instructions [0]); ++word) {
		syntax_rule (0, 1, instructions [word], separators, '\0', COLOUR_YELLOW);
	}
	for (word = 0; word != sizeof (registers) / sizeof (registers [0]); ++word) {
		syntax_rule (0, 1, registers [word], separators, '\0', COLOUR_CYAN);
	}
	for (word = 0; word != sizeof (keywords) / sizeof (keywords [0]); ++word) {
		syntax_rule (0, 1, keywords [word], separators, '\0', COLOUR_YELLOW);
	}

	/* Single-character brackets and operators. */
	syntax_rule (1, 0, "()[]{}",      "", '\0', COLOUR_BLUE);
	syntax_rule (1, 0, ".,+-=:;%$<>", "", '\0', COLOUR_CYAN);

	/* Numbers and identifiers, each running up to the next separator. */
	syntax_rule (1, 1, "0123456789",                 separators, '\0', COLOUR_PINK);
	syntax_rule (1, 1, "abcdefghijklmnopqrstuvwxyz", separators, '\0', COLOUR_WHITE);
	syntax_rule (1, 1, "ABCDEFGHIJKLMNOPQRSTUVWXYZ", separators, '\0', COLOUR_WHITE);
	syntax_rule (1, 1, "_",                          separators, '\0', COLOUR_WHITE);
}
/*
 * Produce a colour-annotated copy of 'code' using the registered rules.
 *
 * The input is split into tokens with syntax_loop. A token that matches a
 * rule is emitted as "\003" + the rule's colour code (at most two
 * characters) + the token text + "\017"; text that matches no rule is
 * copied through unchanged.
 *
 * code - NUL-terminated source text; NULL is treated as an empty string.
 *
 * Returns a pointer to a static buffer that is overwritten by the next
 * call, so the function is not reentrant and the result must be consumed or
 * copied before calling again.
 *
 * Both the working copy of the input and the output are limited by their
 * static buffers: over-long input is cut short and the output stops (on a
 * token boundary where possible) once the buffer is full. Previously either
 * case wrote past the end of the buffers.
 */
char * syntax_highlight (char * code) {
	static char buffer [4096] = "";
	static char string [4096] = "";

	size_t select, length, offset, total, used;

	memset (buffer, 0, sizeof (buffer));
	memset (string, 0, sizeof (string));

	if (code == NULL) {
		return (buffer);
	}

	/* Bounded copy; the memset above keeps the tail zeroed. Two bytes of
	 * slack are left so that a one-byte look-ahead past the terminator by
	 * the scanner still lands inside the buffer. */
	strncpy (string, code, sizeof (string) - 2);

	total = strlen (string);
	used  = 0;

	for (offset = 0; offset < total; offset += length) {
		size_t markup, space;
		int    clipped = 0;

		/* Fallback in case the scanner leaves 'length' untouched: the token
		 * then extends to the end of the input. */
		length = total - offset;
		select = syntax_loop (& string [offset], & length);

		/* Guarantee forward progress and never read past the input. */
		if ((length == 0) || (length > total - offset)) {
			length = total - offset;
		}

		/* A coloured token needs "\003", two colour bytes and "\017". */
		markup = (select < syntax_count) ? 4 : 0;
		space  = (sizeof (buffer) - 1) - used;

		if (space <= markup) {
			break;
		}
		if (length > space - markup) {
			length  = space - markup;
			clipped = 1;
		}

		if (select < syntax_count) {
			strncat (buffer, "\003", 1);
			strncat (buffer, syntax_colour [select], 2);
			strncat (buffer, & string [offset], length);
			strncat (buffer, "\017", 1);
		} else {
			strncat (buffer, & string [offset], length);
		}

		used += strlen (& buffer [used]);

		if (clipped) {
			break;
		}
	}

	return (buffer);
}