commit 65521e4df17b2f50f25d262f5a7cd7e84dce80d2
Author: Blendi-Goose <87442375+Blendi-Goose@users.noreply.github.com>
Date: Sun Apr 12 19:22:07 2026 +0200
initial commit
diff --git a/.gitignore b/.gitignore
new file mode 100644
index 0000000..6e5eb67
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1,2 @@
+build
+noom
diff --git a/LICENSE b/LICENSE
new file mode 100644
index 0000000..5357f69
--- /dev/null
+++ b/LICENSE
@@ -0,0 +1,166 @@
+ GNU LESSER GENERAL PUBLIC LICENSE
+ Version 3, 29 June 2007
+
+ Copyright (C) 2007 Free Software Foundation, Inc. <https://fsf.org/>
+ Everyone is permitted to copy and distribute verbatim copies
+ of this license document, but changing it is not allowed.
+
+
+ This version of the GNU Lesser General Public License incorporates
+the terms and conditions of version 3 of the GNU General Public
+License, supplemented by the additional permissions listed below.
+
+ 0. Additional Definitions.
+
+ As used herein, "this License" refers to version 3 of the GNU Lesser
+General Public License, and the "GNU GPL" refers to version 3 of the GNU
+General Public License.
+
+ "The Library" refers to a covered work governed by this License,
+other than an Application or a Combined Work as defined below.
+
+ An "Application" is any work that makes use of an interface provided
+by the Library, but which is not otherwise based on the Library.
+Defining a subclass of a class defined by the Library is deemed a mode
+of using an interface provided by the Library.
+
+ A "Combined Work" is a work produced by combining or linking an
+Application with the Library. The particular version of the Library
+with which the Combined Work was made is also called the "Linked
+Version".
+
+ The "Minimal Corresponding Source" for a Combined Work means the
+Corresponding Source for the Combined Work, excluding any source code
+for portions of the Combined Work that, considered in isolation, are
+based on the Application, and not on the Linked Version.
+
+ The "Corresponding Application Code" for a Combined Work means the
+object code and/or source code for the Application, including any data
+and utility programs needed for reproducing the Combined Work from the
+Application, but excluding the System Libraries of the Combined Work.
+
+ 1. Exception to Section 3 of the GNU GPL.
+
+ You may convey a covered work under sections 3 and 4 of this License
+without being bound by section 3 of the GNU GPL.
+
+ 2. Conveying Modified Versions.
+
+ If you modify a copy of the Library, and, in your modifications, a
+facility refers to a function or data to be supplied by an Application
+that uses the facility (other than as an argument passed when the
+facility is invoked), then you may convey a copy of the modified
+version:
+
+ a) under this License, provided that you make a good faith effort to
+ ensure that, in the event an Application does not supply the
+ function or data, the facility still operates, and performs
+ whatever part of its purpose remains meaningful, or
+
+ b) under the GNU GPL, with none of the additional permissions of
+ this License applicable to that copy.
+
+ 3. Object Code Incorporating Material from Library Header Files.
+
+ The object code form of an Application may incorporate material from
+a header file that is part of the Library. You may convey such object
+code under terms of your choice, provided that, if the incorporated
+material is not limited to numerical parameters, data structure
+layouts and accessors, or small macros, inline functions and templates
+(ten or fewer lines in length), you do both of the following:
+
+ a) Give prominent notice with each copy of the object code that the
+ Library is used in it and that the Library and its use are
+ covered by this License.
+
+ b) Accompany the object code with a copy of the GNU GPL and this license
+ document.
+
+ 4. Combined Works.
+
+ You may convey a Combined Work under terms of your choice that,
+taken together, effectively do not restrict modification of the
+portions of the Library contained in the Combined Work and reverse
+engineering for debugging such modifications, if you also do each of
+the following:
+
+ a) Give prominent notice with each copy of the Combined Work that
+ the Library is used in it and that the Library and its use are
+ covered by this License.
+
+ b) Accompany the Combined Work with a copy of the GNU GPL and this license
+ document.
+
+ c) For a Combined Work that displays copyright notices during
+ execution, include the copyright notice for the Library among
+ these notices, as well as a reference directing the user to the
+ copies of the GNU GPL and this license document.
+
+ d) Do one of the following:
+
+ 0) Convey the Minimal Corresponding Source under the terms of this
+ License, and the Corresponding Application Code in a form
+ suitable for, and under terms that permit, the user to
+ recombine or relink the Application with a modified version of
+ the Linked Version to produce a modified Combined Work, in the
+ manner specified by section 6 of the GNU GPL for conveying
+ Corresponding Source.
+
+ 1) Use a suitable shared library mechanism for linking with the
+ Library. A suitable mechanism is one that (a) uses at run time
+ a copy of the Library already present on the user's computer
+ system, and (b) will operate properly with a modified version
+ of the Library that is interface-compatible with the Linked
+ Version.
+
+ e) Provide Installation Information, but only if you would otherwise
+ be required to provide such information under section 6 of the
+ GNU GPL, and only to the extent that such information is
+ necessary to install and execute a modified version of the
+ Combined Work produced by recombining or relinking the
+ Application with a modified version of the Linked Version. (If
+ you use option 4d0, the Installation Information must accompany
+ the Minimal Corresponding Source and Corresponding Application
+ Code. If you use option 4d1, you must provide the Installation
+ Information in the manner specified by section 6 of the GNU GPL
+ for conveying Corresponding Source.)
+
+ 5. Combined Libraries.
+
+ You may place library facilities that are a work based on the
+Library side by side in a single library together with other library
+facilities that are not Applications and are not covered by this
+License, and convey such a combined library under terms of your
+choice, if you do both of the following:
+
+ a) Accompany the combined library with a copy of the same work based
+ on the Library, uncombined with any other library facilities,
+ conveyed under the terms of this License.
+
+ b) Give prominent notice with the combined library that part of it
+ is a work based on the Library, and explaining where to find the
+ accompanying uncombined form of the same work.
+
+ 6. Revised Versions of the GNU Lesser General Public License.
+
+ The Free Software Foundation may publish revised and/or new versions
+of the GNU Lesser General Public License from time to time. Such new
+versions will be similar in spirit to the present version, but may
+differ in detail to address new problems or concerns.
+
+ Each version is given a distinguishing version number. If the
+Library as you received it specifies that a certain numbered version
+of the GNU Lesser General Public License "or any later version"
+applies to it, you have the option of following the terms and
+conditions either of that published version or of any later version
+published by the Free Software Foundation. If the Library as you
+received it does not specify a version number of the GNU Lesser
+General Public License, you may choose any version of the GNU Lesser
+General Public License ever published by the Free Software Foundation.
+
+ If the Library as you received it specifies that a proxy can decide
+whether future versions of the GNU Lesser General Public License shall
+apply, that proxy's public statement of acceptance of any version is
+permanent authorization for you to choose that version for the
+Library.
+
diff --git a/README.md b/README.md
new file mode 100644
index 0000000..44c01fe
--- /dev/null
+++ b/README.md
@@ -0,0 +1,4 @@
+# noom
+> Lua is moon in Portuguese and noom is moon in reverse.
+
+A reimplementation of Lua. Or rather, it will be one; it doesn't do much yet.
diff --git a/build.lua b/build.lua
new file mode 100644
index 0000000..14a7db0
--- /dev/null
+++ b/build.lua
@@ -0,0 +1,40 @@
+-- i love build scripts i love build scripts i love build scripts scripts build love i script build love me i love script build i script love build
+
+-- TODO: script the build
+
+-- Returns the base name of `path`: the text after the last '/' with its final
+-- ".ext" suffix (if any) removed, e.g. "src/lexer.c" -> "lexer".
+-- Dots in directory names are ignored ("a.b/c" -> "c"); the previous scan
+-- treated them as the extension separator and returned "" for such paths.
+local function filename(path)
+    local base = path:match("[^/]*$") -- everything after the last slash
+    -- the outer parentheses drop gsub's second result (the replacement count)
+    return (base:gsub("%.[^.]*$", ""))
+end
+
+local function runCommand(cmd) -- echoes "> " .. cmd, runs cmd, returns os.execute's result(s)
+    io.stdout:write("> " .. cmd, "\n")
+    return os.execute(cmd)
+end
+
+-- Start from an empty build directory (-f and -p keep a first-ever build quiet).
+runCommand('rm -rf build')
+runCommand('mkdir -p build')
+
+-- Translation units to compile, in build order.
+local files = { 'src/lexer.c', 'src/helper.c', 'src/main.c' }
+
+-- Runs `cmd` and aborts the build when it fails. os.execute signals success
+-- with 0 on Lua 5.1 and with true on 5.2+, so either value is accepted.
+local function must(cmd)
+    local ok = runCommand(cmd)
+    if ok ~= true and ok ~= 0 then os.exit(1) end
+end
+
+-- Compile every source to build/<name>.o, then link the objects into ./noom.
+local objects = {}
+for _, src in ipairs(files) do
+    objects[#objects + 1] = "build/" .. filename(src) .. '.o'
+    must('clang -c -o ' .. objects[#objects] .. ' ' .. src)
+end
+must('clang -o noom ' .. table.concat(objects, ' '))
diff --git a/src/helper.c b/src/helper.c
new file mode 100644
index 0000000..02a34f2
--- /dev/null
+++ b/src/helper.c
@@ -0,0 +1,22 @@
+#include "helper.h"
+#include "types.h"
+
+// Returns 1 when the NUL-terminated `compare` is a prefix of `str`, else 0.
+// An empty `compare` matches everything. `str` is never read past its own
+// terminator: a '\0' in `str` differs from any remaining `compare` character.
+int noom_startswith(const char* str, char* compare) {
+    for (noom_uint_t pos = 0; compare[pos] != '\0'; pos++) {
+        if (compare[pos] != str[pos]) return 0;
+    }
+    return 1; // consumed all of `compare` without a mismatch
+}
+
+// Length-aware equality: returns 1 when both ranges have the same length and
+// identical bytes, 0 otherwise. At most `lena` bytes of each argument are
+// read, so neither one needs a NUL terminator.
+int noom_streql(const char* stra, noom_uint_t lena, const char* strb, noom_uint_t lenb) {
+    if (lena != lenb) return 0;
+    noom_uint_t idx = 0;
+    while (idx < lena && stra[idx] == strb[idx]) idx++; // stop at the first mismatch
+    return idx == lena;
+}
diff --git a/src/helper.h b/src/helper.h
new file mode 100644
index 0000000..1ce78b3
--- /dev/null
+++ b/src/helper.h
@@ -0,0 +1,4 @@
+#pragma once // include guard: keeps repeated inclusion of this header harmless
+#include "types.h"
+int noom_startswith(const char* str, char* compare); // 1 if `compare` is a prefix of `str`, else 0
+int noom_streql(const char* stra, noom_uint_t lena, const char* strb, noom_uint_t lenb); // 1 if same length and bytes; rename to something better?
diff --git a/src/lexer.c b/src/lexer.c
new file mode 100644
index 0000000..ecda06a
--- /dev/null
+++ b/src/lexer.c
@@ -0,0 +1,158 @@
+#include "types.h"
+#include "helper.h"
+#include "lexer.h"
+
+int noomL_isalpha(char c) { // 1 if c is in 'a'..'z' or 'A'..'Z', else 0
+    return ('A' <= c && c <= 'Z') || ('a' <= c && c <= 'z');
+}
+
+int noomL_isnumber(char c) { // 1 if c is a decimal digit '0'..'9', else 0
+    return !(c < '0' || c > '9');
+}
+
+int noomL_isalphanum(char c) { // 1 if c is a letter or a decimal digit, else 0
+    return noomL_isalpha(c) ? 1 : (noomL_isnumber(c) != 0);
+}
+
+int noomL_iswhitespace(char c) { // 1 for space, \t, \n, \r, \f, \v (the characters Lua treats as spaces), else 0
+    return c == ' ' || c == '\t' || c == '\n' || c == '\r' || c == '\f' || c == '\v';
+}
+
+// Reports how many bytes the operator/punctuation token at the start of `s`
+// occupies: 3, 2 or 1 for a recognised symbol, 0 when `s` starts with none.
+// Only the leading bytes of `s` are inspected; whatever follows is ignored.
+noom_uint_t noomL_getsymbol(const char* s) { // TODO: find a less brute-force way to do this
+    // Entries are tried top to bottom and the first match wins, so a longer
+    // spelling must come before its own prefixes ("..." before ".." before
+    // ".", "==" before "=", and so on).
+    static const struct {
+        char* text; // not const-qualified because noom_startswith takes a plain char*
+        noom_uint_t length;
+    } symbols[] = {
+        { "...", 3 },
+
+        { "==", 2 }, { "~=", 2 }, { "<=", 2 }, { ">=", 2 }, { "..", 2 },
+
+        { "+", 1 }, { "-", 1 }, { "*", 1 }, { "/", 1 }, { "%", 1 },
+        { "^", 1 }, { "#", 1 }, { "<", 1 }, { ">", 1 },
+
+        { "=", 1 }, { ",", 1 },
+
+        { "(", 1 }, { ")", 1 }, { "{", 1 }, { "}", 1 }, { "[", 1 }, { "]", 1 },
+
+        { ":", 1 }, { ".", 1 },
+
+        { ";", 1 },
+    };
+    const noom_uint_t count = sizeof symbols / sizeof symbols[0];
+
+    for (noom_uint_t i = 0; i < count; i++) {
+        if (noom_startswith(s, symbols[i].text)) {
+            return symbols[i].length;
+        }
+    }
+
+    return 0; // no symbol
+}
+
+// Counts the decimal digits at the start of `s`; returns 0 when `s` does not
+// begin with a digit. Signs, fractions, exponents and hex are not handled yet.
+noom_uint_t noomL_getnumber(const char* s) { // TODO: more number kinds idk
+    const char* end = s;
+
+    while (noomL_isnumber(*end)) end++; // '\0' is not a digit, so this stops at the terminator
+    return (noom_uint_t)(end - s);
+}
+
+// Returns 1 when the `len` bytes starting at `s` are exactly one of the
+// reserved words in the table below, 0 otherwise. The comparison is
+// length-delimited, so `s` may point into the middle of a larger buffer.
+int noomL_iskeyword(const char* s, noom_uint_t len) {
+    static const struct {
+        const char* word;
+        noom_uint_t length;
+    } keywords[] = {
+        // literals
+        { "true", 4 }, { "false", 5 }, { "nil", 3 },
+        // conditionals
+        { "if", 2 }, { "then", 4 }, { "else", 4 }, { "elseif", 6 },
+        // logical operators
+        { "and", 3 }, { "or", 2 }, { "not", 3 },
+        // declarations
+        { "local", 5 },
+        // loops, functions, blocks and control transfer
+        { "for", 3 }, { "function", 8 }, { "do", 2 }, { "until", 5 },
+        { "goto", 4 }, { "while", 5 }, { "repeat", 6 }, { "end", 3 },
+        { "in", 2 }, { "return", 6 }, { "break", 5 },
+    };
+    const noom_uint_t count = sizeof keywords / sizeof keywords[0];
+
+    // An exact, length-checked match is required, so table order is irrelevant.
+    for (noom_uint_t i = 0; i < count; i++) {
+        if (noom_streql(s, len, keywords[i].word, keywords[i].length)) return 1;
+    }
+
+    return 0; // not a reserved word
+}
+
+// Writes one token's type and source span into *token.
+static void noomL_emit(noomL_Token* token, noomL_TokenType type, noom_uint_t offset, noom_uint_t length) {
+    token->type = type;
+    token->offset = offset;
+    token->length = length;
+}
+
+// Lexes the single token that starts at byte offset `start` of `s`.
+//
+// s     - NUL-terminated source text; s[start] is read unconditionally
+// start - offset of the first byte of the token to read
+// token - out parameter; written only when NOOML_ERROR_NONE is returned
+//
+// Token kinds are tried in a fixed order: end of input, one whitespace
+// character, identifier/keyword, symbol, number. When none matches,
+// NOOML_ERROR_UNKNOWN is returned and *token is left untouched.
+noomL_ErrorType noomL_lex(const char* s, noom_uint_t start, noomL_Token* token) {
+    const char* cursor = s + start;
+    const char first = cursor[0];
+
+    // End of input: zero-length EOF token.
+    if (first == '\0') {
+        noomL_emit(token, NOOML_TOKEN_EOF, start, 0);
+        return NOOML_ERROR_NONE;
+    }
+
+    // TODO: maybe handle multiple at once? for now it should be okay
+    if (noomL_iswhitespace(first)) {
+        noomL_emit(token, NOOML_TOKEN_WHITESPACE, start, 1);
+        return NOOML_ERROR_NONE;
+    }
+
+    // Identifier or keyword: a letter or '_' followed by letters, digits, '_'.
+    if (first == '_' || noomL_isalpha(first)) { // TODO: maybe abstract into function for "can start ident"?
+        noom_uint_t end = 1;
+        while (cursor[end] == '_' || noomL_isalphanum(cursor[end])) end++; // same TODO applies here
+
+        // A word is an identifier unless it spells a reserved word.
+        noomL_TokenType kind = noomL_iskeyword(cursor, end) ? NOOML_TOKEN_KEYWORD : NOOML_TOKEN_IDENTIFIER;
+        noomL_emit(token, kind, start, end);
+        return NOOML_ERROR_NONE;
+    }
+
+    // Operator or punctuation.
+    noom_uint_t matched = noomL_getsymbol(cursor);
+    if (matched != 0) {
+        noomL_emit(token, NOOML_TOKEN_SYMBOL, start, matched);
+        return NOOML_ERROR_NONE;
+    }
+
+    // Run of decimal digits.
+    matched = noomL_getnumber(cursor);
+    if (matched != 0) {
+        noomL_emit(token, NOOML_TOKEN_NUMBER, start, matched);
+        return NOOML_ERROR_NONE;
+    }
+
+    // Nothing matched.
+    return NOOML_ERROR_UNKNOWN;
+}
+
diff --git a/src/lexer.h b/src/lexer.h
new file mode 100644
index 0000000..143be59
--- /dev/null
+++ b/src/lexer.h
@@ -0,0 +1,36 @@
+#pragma once // include guard: this header defines enums and a struct, so a second inclusion would not compile
+#include "types.h"
+typedef enum noomL_TokenType { // kind of token stored in noomL_Token.type
+ NOOML_TOKEN_EOF = 0, // end of input: the NUL terminator was reached
+ NOOML_TOKEN_KEYWORD, // identifier-shaped word that is a reserved word
+ NOOML_TOKEN_WHITESPACE, // a single whitespace character
+ NOOML_TOKEN_IDENTIFIER, // letter or '_' followed by letters, digits and '_'
+ NOOML_TOKEN_STRING, // NOTE(review): declared, but noomL_lex in lexer.c never produces it yet
+ NOOML_TOKEN_SYMBOL, // operator or punctuation, 1 to 3 characters long
+ NOOML_TOKEN_NUMBER, // run of decimal digits
+
+ NOOML_TOKEN_TCOUNT, // not a token kind: count of the kinds above (keep last)
+} noomL_TokenType;
+
+typedef enum noomL_ErrorType { // result code returned by noomL_lex
+ NOOML_ERROR_NONE = 0, // a token was produced
+ NOOML_ERROR_UNKNOWN = 1, // no token kind matched the input at the requested offset
+} noomL_ErrorType;
+
+typedef struct noomL_Token { // one lexed token, described as a span of the source string
+ noomL_TokenType type; // which kind of token this is
+ noom_uint_t offset; // index of the token's first char in the source string
+ noom_uint_t length; // number of chars the token spans (0 for EOF)
+} noomL_Token;
+
+
+int noomL_isalpha(char c); // nonzero if c is in 'a'..'z' or 'A'..'Z'
+int noomL_isnumber(char c); // nonzero if c is a decimal digit
+int noomL_isalphanum(char c); // nonzero if c is a letter or a decimal digit
+int noomL_iswhitespace(char c); // nonzero if c is a whitespace character
+
+noom_uint_t noomL_getsymbol(const char* s); // length of the symbol at the start of s, 0 if none
+noom_uint_t noomL_getnumber(const char* s); // length of the digit run at the start of s, 0 if none
+
+noomL_ErrorType noomL_lex(const char* s, noom_uint_t start, noomL_Token* token); // lexes the token at s + start into *token; TODO: add more error data
+
diff --git a/src/main.c b/src/main.c
new file mode 100644
index 0000000..d5a9f07
--- /dev/null
+++ b/src/main.c
@@ -0,0 +1,24 @@
+#include <stdio.h> // for now
+#include "lexer.h"
+
+int main(int argc, char** argv) { // demo driver; argc/argv are unused for now
+    const char* code = "local a = 5;";
+    noom_uint_t pos = 0;
+    noomL_Token token;
+
+    // Print one "<type> <text>" line per token until EOF.
+    while (1) {
+        // noomL_lex leaves `token` unset on failure: stop rather than print
+        // and advance by stale or uninitialized data.
+        if (noomL_lex(code, pos, &token) != NOOML_ERROR_NONE) {
+            fprintf(stderr, "lex error at offset %lu\n", pos);
+            return 1;
+        }
+        printf("%d ", token.type);
+        for (noom_uint_t i = 0; i < token.length; i++) putchar((code + token.offset)[i]);
+        putchar('\n');
+
+        if (token.type == NOOML_TOKEN_EOF) return 0;
+        pos += token.length;
+    }
+}
diff --git a/src/types.h b/src/types.h
new file mode 100644
index 0000000..a9b50cb
--- /dev/null
+++ b/src/types.h
@@ -0,0 +1 @@
+typedef unsigned long noom_uint_t; // unsigned integer type used for offsets, lengths and indices