- Moved all language highlighter implementations (`CppHighlighter`, `GoHighlighter`, `JsonHighlighter`, etc.), the engine, and registry to `syntax/`.
156 lines
3.8 KiB
C++
156 lines
3.8 KiB
C++
#include "SqlHighlighter.h"
|
|
#include "../Buffer.h"
|
|
#include <cctype>
|
|
|
|
namespace kte {
|
|
static void
|
|
push(std::vector<HighlightSpan> &out, int a, int b, TokenKind k)
|
|
{
|
|
if (b > a)
|
|
out.push_back({a, b, k});
|
|
}
|
|
|
|
|
|
static bool
|
|
is_ident_start(char c)
|
|
{
|
|
return std::isalpha(static_cast<unsigned char>(c)) || c == '_';
|
|
}
|
|
|
|
|
|
static bool
|
|
is_ident_char(char c)
|
|
{
|
|
return std::isalnum(static_cast<unsigned char>(c)) || c == '_' || c == '$';
|
|
}
|
|
|
|
|
|
SqlHighlighter::SqlHighlighter()
|
|
{
|
|
const char *kw[] = {
|
|
"select", "insert", "update", "delete", "from", "where", "group", "by", "order", "limit",
|
|
"offset", "values", "into", "create", "table", "index", "unique", "on", "as", "and", "or",
|
|
"not", "null", "is", "primary", "key", "constraint", "foreign", "references", "drop", "alter",
|
|
"add", "column", "rename", "to", "if", "exists", "join", "left", "right", "inner", "outer",
|
|
"cross", "using", "set", "distinct", "having", "union", "all", "case", "when", "then", "else",
|
|
"end", "pragma", "transaction", "begin", "commit", "rollback", "replace"
|
|
};
|
|
for (auto s: kw)
|
|
kws_.insert(s);
|
|
|
|
const char *types[] = {"integer", "real", "text", "blob", "numeric", "boolean", "date", "datetime"};
|
|
for (auto s: types)
|
|
types_.insert(s);
|
|
}
|
|
|
|
|
|
void
|
|
SqlHighlighter::HighlightLine(const Buffer &buf, int row, std::vector<HighlightSpan> &out) const
|
|
{
|
|
const auto &rows = buf.Rows();
|
|
if (row < 0 || static_cast<std::size_t>(row) >= rows.size())
|
|
return;
|
|
std::string s = static_cast<std::string>(rows[static_cast<std::size_t>(row)]);
|
|
int n = static_cast<int>(s.size());
|
|
int i = 0;
|
|
|
|
while (i < n) {
|
|
char c = s[i];
|
|
if (c == ' ' || c == '\t') {
|
|
int j = i + 1;
|
|
while (j < n && (s[j] == ' ' || s[j] == '\t'))
|
|
++j;
|
|
push(out, i, j, TokenKind::Whitespace);
|
|
i = j;
|
|
continue;
|
|
}
|
|
// line comments: -- ...
|
|
if (c == '-' && i + 1 < n && s[i + 1] == '-') {
|
|
push(out, i, n, TokenKind::Comment);
|
|
break;
|
|
}
|
|
// simple block comment on same line: /* ... */
|
|
if (c == '/' && i + 1 < n && s[i + 1] == '*') {
|
|
int j = i + 2;
|
|
bool closed = false;
|
|
while (j + 1 <= n) {
|
|
if (j + 1 < n && s[j] == '*' && s[j + 1] == '/') {
|
|
j += 2;
|
|
closed = true;
|
|
break;
|
|
}
|
|
++j;
|
|
}
|
|
if (!closed) {
|
|
push(out, i, n, TokenKind::Comment);
|
|
break;
|
|
} else {
|
|
push(out, i, j, TokenKind::Comment);
|
|
i = j;
|
|
continue;
|
|
}
|
|
}
|
|
// strings: '...' or "..."
|
|
if (c == '\'' || c == '"') {
|
|
char q = c;
|
|
int j = i + 1;
|
|
bool esc = false;
|
|
while (j < n) {
|
|
char d = s[j++];
|
|
if (d == q) {
|
|
// Handle doubled quote escaping for SQL single quotes
|
|
if (q == '\'' && j < n && s[j] == '\'') {
|
|
++j;
|
|
continue;
|
|
}
|
|
break;
|
|
}
|
|
if (d == '\\') {
|
|
esc = !esc;
|
|
} else {
|
|
esc = false;
|
|
}
|
|
}
|
|
push(out, i, j, TokenKind::String);
|
|
i = j;
|
|
continue;
|
|
}
|
|
if (std::isdigit(static_cast<unsigned char>(c))) {
|
|
int j = i + 1;
|
|
while (j < n && (std::isalnum(static_cast<unsigned char>(s[j])) || s[j] == '.' || s[j] == '_'))
|
|
++j;
|
|
push(out, i, j, TokenKind::Number);
|
|
i = j;
|
|
continue;
|
|
}
|
|
if (is_ident_start(c)) {
|
|
int j = i + 1;
|
|
while (j < n && is_ident_char(s[j]))
|
|
++j;
|
|
std::string id = s.substr(i, j - i);
|
|
std::string lower;
|
|
lower.reserve(id.size());
|
|
for (char ch: id)
|
|
lower.push_back(static_cast<char>(std::tolower(static_cast<unsigned char>(ch))));
|
|
TokenKind k = TokenKind::Identifier;
|
|
if (kws_.count(lower))
|
|
k = TokenKind::Keyword;
|
|
else if (types_.count(lower))
|
|
k = TokenKind::Type;
|
|
push(out, i, j, k);
|
|
i = j;
|
|
continue;
|
|
}
|
|
if (std::ispunct(static_cast<unsigned char>(c))) {
|
|
TokenKind k = TokenKind::Operator;
|
|
if (c == ',' || c == ';' || c == '(' || c == ')')
|
|
k = TokenKind::Punctuation;
|
|
push(out, i, i + 1, k);
|
|
++i;
|
|
continue;
|
|
}
|
|
push(out, i, i + 1, TokenKind::Default);
|
|
++i;
|
|
}
|
|
}
|
|
} // namespace kte
|