diff options
author | Clyne Sullivan <clyne@bitgloo.com> | 2023-11-13 22:04:32 -0500 |
---|---|---|
committer | Clyne Sullivan <clyne@bitgloo.com> | 2023-11-13 22:04:32 -0500 |
commit | ebbde43fa98315a57a15650944f80757f9652b9b (patch) | |
tree | 71fb83ce0d0e7f1b03959f2ddb0663bc2e142578 /libalee | |
parent | 23d746d646adb6b11fa7758a2490ff955c8a9b91 (diff) | |
parent | 0810456e9c5c19a47511a682eeabc71008632a2c (diff) |
Merge branch 'documentation'
Diffstat (limited to 'libalee')
-rw-r--r-- | libalee/corewords.cpp | 152 | ||||
-rw-r--r-- | libalee/corewords.hpp | 90 | ||||
-rw-r--r-- | libalee/ctype.hpp | 46 | ||||
-rw-r--r-- | libalee/dictionary.cpp | 12 | ||||
-rw-r--r-- | libalee/dictionary.hpp | 200 | ||||
-rw-r--r-- | libalee/parser.cpp | 14 | ||||
-rw-r--r-- | libalee/parser.hpp | 79 | ||||
-rw-r--r-- | libalee/state.hpp | 117 | ||||
-rw-r--r-- | libalee/types.hpp | 116 |
9 files changed, 543 insertions, 283 deletions
diff --git a/libalee/corewords.cpp b/libalee/corewords.cpp index b768163..7c79aea 100644 --- a/libalee/corewords.cpp +++ b/libalee/corewords.cpp @@ -20,22 +20,9 @@ #include <utility> -LIBALEE_SECTION -void find(State& state, Word word) -{ - Cell tok = 0; - Cell imm = 0; - - if (auto j = state.dict.find(word); j > 0) { - tok = state.dict.getexec(j); - imm = (state.dict.read(j) & Dictionary::Immediate) ? 1 : -1; - } else if (tok = CoreWords::findi(state, word); tok >= 0) { - imm = (tok == CoreWords::Semicolon) ? 1 : -1; - } - - state.push(tok); - state.push(imm); -} +static void find(State&, Word); +static DoubleCell popd(State&); +static void pushd(State&, DoubleCell); LIBALEE_SECTION void CoreWords::run(Cell ins, State& state) @@ -44,21 +31,8 @@ void CoreWords::run(Cell ins, State& state) DoubleCell dcell; Addr index = ins; - auto& ip = state.ip(); - auto popd = [](State& s) { - DoubleCell dcell = s.pop(); - dcell <<= sizeof(Cell) * 8; - dcell |= static_cast<Addr>(s.pop()); - return dcell; - }; - - auto pushd = [](State& s, DoubleCell d) { - s.push(static_cast<Cell>(d)); - s.push(static_cast<Cell>(d >> (sizeof(Cell) * 8))); - }; - execute: if (index >= Dictionary::Begin) { // must be calling a defined subroutine @@ -66,95 +40,95 @@ execute: ip = index; return; } else switch (index) { - case 0: // _lit + case token("_lit"): // Execution semantics of `literal`. state.push(state.beyondip()); break; - case 1: // drop + case token("drop"): state.pop(); break; - case 2: // dup + case token("dup"): state.push(state.top()); break; - case 3: // swap + case token("swap"): std::swap(state.top(), state.pick(1)); break; - case 4: // pick + case token("pick"): state.push(state.pick(state.pop())); break; - case 5: // sys + case token("sys"): // Calls user-defined "system" handler. user_sys(state); break; - case 6: // add + case token("+"): cell = state.pop(); state.top() += cell; break; - case 7: // sub + case token("-"): cell = state.pop(); state.top() -= cell; break; - case 8: // mul ( n n -- d ) + case token("m*"): // ( n n -- d ) cell = state.pop(); dcell = state.pop() * cell; pushd(state, dcell); break; - case 9: // div ( d n -- n ) + case token("_/"): // ( d n -- n ) cell = state.pop(); dcell = popd(state); state.push(static_cast<Cell>(dcell / cell)); break; - case 10: // mod ( d n -- n ) + case token("_%"): // ( d n -- n ) cell = state.pop(); dcell = popd(state); state.push(static_cast<Cell>(dcell % cell)); break; - case 11: // peek + case token("_@"): // ( addr cell? -- n ) if (state.pop()) state.push(state.dict.read(state.pop())); else state.push(state.dict.readbyte(state.pop())); break; - case 12: // poke + case token("_!"): // ( n addr cell? -- ) cell = state.pop(); if (auto addr = state.pop(); cell) state.dict.write(addr, state.pop()); else state.dict.writebyte(addr, state.pop() & 0xFFu); break; - case 13: // pushr + case token(">r"): state.pushr(state.pop()); break; - case 14: // popr + case token("r>"): state.push(state.popr()); break; - case 15: // equal + case token("="): cell = state.pop(); state.top() = state.top() == cell ? -1 : 0; break; - case 16: // lt + case token("<"): cell = state.pop(); state.top() = state.top() < cell ? -1 : 0; break; - case 17: // and + case token("&"): cell = state.pop(); state.top() &= cell; break; - case 18: // or + case token("|"): cell = state.pop(); state.top() |= cell; break; - case 19: // xor + case token("^"): cell = state.pop(); state.top() ^= cell; break; - case 20: // shl + case token("<<"): cell = state.pop(); reinterpret_cast<Addr&>(state.top()) <<= static_cast<Addr>(cell); break; - case 21: // shr + case token(">>"): cell = state.pop(); reinterpret_cast<Addr&>(state.top()) >>= static_cast<Addr>(cell); break; - case 22: // colon + case token(":"): // Begins definition/compilation of new word. state.push(state.dict.alignhere()); state.dict.write(Dictionary::CompToken, state.top()); while (!state.dict.hasInput()) @@ -162,50 +136,53 @@ execute: state.dict.addDefinition(state.dict.input()); state.compiling(true); break; - case 23: // tick + case token("_'"): // Collects input word and finds execution token. while (!state.dict.hasInput()) state.input(); find(state, state.dict.input()); break; - case 24: // execute + case token("execute"): index = state.pop(); goto execute; - case 25: // exit + case token("exit"): ip = state.popr(); state.verify(ip != 0, Error::exit); break; - case 26: // semic - state.dict.add(findi("exit")); + case token(";"): // Concludes word definition. + state.dict.add(token("exit")); state.compiling(false); cell = state.pop(); dcell = cell - state.dict.latest(); - if (dcell > (1 << (sizeof(Cell) * 8 - 6)) - 1) { - state.dict.write(static_cast<Addr>(cell) + sizeof(Cell), static_cast<Cell>(dcell)); - dcell = ((1 << (sizeof(Cell) * 8 - 6)) - 1); + if (dcell >= Dictionary::MaxDistance) { + // Large distance to previous entry: store in dedicated cell. + state.dict.write(static_cast<Addr>(cell) + sizeof(Cell), + static_cast<Cell>(dcell)); + dcell = Dictionary::MaxDistance; } - state.dict.write(cell, (state.dict.read(cell) & 0x1F) | static_cast<Cell>(dcell << 6)); + state.dict.write(cell, + (state.dict.read(cell) & 0x1F) | static_cast<Cell>(dcell << 6)); state.dict.latest(cell); break; - case 27: // _jmp0 + case token("_jmp0"): // Jump if popped value equals zero. if (state.pop()) { state.beyondip(); break; } [[fallthrough]]; - case 28: // _jmp + case token("_jmp"): // Unconditional jump. ip = state.beyondip(); return; - case 29: // depth + case token("depth"): state.push(static_cast<Cell>(state.size())); break; - case 30: // _rdepth + case token("_rdepth"): state.push(static_cast<Cell>(state.rsize())); break; - case 31: // _in + case token("_in"): // Fetches more input from the user input source. state.input(); break; - case 32: // _ex + case token("_ev"): // Evaluates words from current input source. { const auto st = state.save(); ip = 0; @@ -213,13 +190,13 @@ execute: state.load(st); } break; - case 33: // find + case token("find"): cell = state.pop(); find(state, Word::fromLength(static_cast<Addr>(cell + 1), state.dict.readbyte(cell))); break; - case 34: // _uma + case token("_uma"): // ( d u u -- d ): Unsigned multiply-add. { const auto plus = state.pop(); cell = state.pop(); @@ -229,12 +206,12 @@ execute: pushd(state, dcell); } break; - case 35: // u< + case token("u<"): cell = state.pop(); state.top() = static_cast<Addr>(state.top()) < static_cast<Addr>(cell) ? -1 : 0; break; - case 36: // um/mod + case token("um/mod"): cell = state.pop(); dcell = popd(state); @@ -245,7 +222,7 @@ execute: static_cast<DoubleAddr>(dcell) / static_cast<Addr>(cell))); break; - default: + default: // Compacted literals (WordCount <= ins < Begin). state.push(ins - WordCount); break; } @@ -259,3 +236,34 @@ Cell CoreWords::findi(State& state, Word word) return findi(word.begin(&state.dict), word.size()); } +LIBALEE_SECTION +void find(State& state, Word word) +{ + Cell tok = 0; + Cell imm = 0; + + if (auto j = state.dict.find(word); j > 0) { + tok = state.dict.getexec(j); + imm = (state.dict.read(j) & Dictionary::Immediate) ? 1 : -1; + } else if (tok = CoreWords::findi(state, word); tok >= 0) { + imm = (tok == CoreWords::token(";")) ? 1 : -1; + } + + state.push(tok); + state.push(imm); +} + +DoubleCell popd(State& s) +{ + DoubleCell dcell = s.pop(); + dcell <<= sizeof(Cell) * 8; + dcell |= static_cast<Addr>(s.pop()); + return dcell; +} + +void pushd(State& s, DoubleCell d) +{ + s.push(static_cast<Cell>(d)); + s.push(static_cast<Cell>(d >> (sizeof(Cell) * 8))); +} + diff --git a/libalee/corewords.hpp b/libalee/corewords.hpp index f4ab851..30d0a42 100644 --- a/libalee/corewords.hpp +++ b/libalee/corewords.hpp @@ -1,54 +1,78 @@ -/** - * Alee Forth: A portable and concise Forth implementation in modern C++. - * Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com> - * - * This program is free software: you can redistribute it and/or modify - * it under the terms of the GNU Lesser General Public License as published by - * the Free Software Foundation, either version 3 of the License, or - * (at your option) any later version. - * - * This program is distributed in the hope that it will be useful, - * but WITHOUT ANY WARRANTY; without even the implied warranty of - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - * GNU Lesser General Public License for more details. - * - * You should have received a copy of the GNU Lesser General Public License - * along with this program. If not, see <https://www.gnu.org/licenses/>. - */ +// +/// @file corewords.hpp +/// @brief Manages the fundamental word-set and its execution. +// +// Alee Forth: A portable and concise Forth implementation in modern C++. +// Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com> +// +// This program is free software: you can redistribute it and/or modify +// it under the terms of the GNU Lesser General Public License as published by +// the Free Software Foundation, either version 3 of the License, or +// (at your option) any later version. +// +// This program is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +// GNU Lesser General Public License for more details. +// +// You should have received a copy of the GNU Lesser General Public License +// along with this program. If not, see <https://www.gnu.org/licenses/>. #ifndef ALEEFORTH_COREWORDS_HPP #define ALEEFORTH_COREWORDS_HPP #include "config.hpp" -#include "types.hpp" #include "dictionary.hpp" +#include "types.hpp" + +#include <algorithm> + +class State; /** * To be implemented by the user, this function is called when the `sys` word * is executed. + * @param state Current execution state object. */ -void user_sys(State&); +void user_sys(State& state); +/** + * @class CoreWords + * @brief Provides the fundamental word-set and manages its execution. + */ class CoreWords { public: - constexpr static Cell WordCount = 37; - constexpr static Cell Semicolon = 26; + /** + * Searches for the token/index of the given word if it is part of the + * fundamental word-set. + * @param state Current execution state object. + * @param word Word (stored in state's dictionary memory) to look up. + * @return The token/index of the word or -1 if not found. + */ + static Cell findi(State& state, Word word); /** - * Finds execution token that corresponds to the given word. - * Returns -1 if not found. + * Looks up the token/index of the given fundamental word. + * Primarily used for compile-time lookup. + * @param word The word to look up. + * @return The token/index of the word or -1 if not found. */ - static Cell findi(State&, Word); - consteval static Cell findi(const char *word) { + consteval static Cell token(const char *word) { return findi(word, strlen(word)); } /** - * Executes the given CoreWord execution token using the given state. + * Executes the given execution token using the given state. + * @param token Any valid execution token (word, fundamental, constant...). + * @param state The state object to execute with. */ - static void run(Cell, State&); + static void run(Cell token, State& state); + /** + * String lookup table for the fundamental word-set. + * This also determines the opcode (index) of these words. + */ constexpr static char wordsarr[] = "_lit\0drop\0dup\0swap\0pick\0sys\0" "+\0-\0m*\0_/\0_%\0" @@ -59,7 +83,19 @@ public: "depth\0_rdepth\0_in\0_ev\0find\0" "_uma\0u<\0um/mod\0"; + /** + * Count of total fundamental words. + */ + constexpr static Cell WordCount = [] { + return std::count(wordsarr, wordsarr + sizeof(wordsarr), '\0'); }(); + private: + /** + * Generic implementation of findi(). Private; use public implementations. + * @param it Beginning iterator of the word to search for. + * @param size Size of the searched-for word i.e. end == it + size. + * @return The token/index of the word or -1 if not found. + */ template<typename Iter> LIBALEE_SECTION constexpr static Cell findi(Iter it, std::size_t size) diff --git a/libalee/ctype.hpp b/libalee/ctype.hpp index b0df174..f7ce3fb 100644 --- a/libalee/ctype.hpp +++ b/libalee/ctype.hpp @@ -1,52 +1,56 @@ -/** - * Alee Forth: A portable and concise Forth implementation in modern C++. - * Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com> - * - * This program is free software: you can redistribute it and/or modify - * it under the terms of the GNU Lesser General Public License as published by - * the Free Software Foundation, either version 3 of the License, or - * (at your option) any later version. - * - * This program is distributed in the hope that it will be useful, - * but WITHOUT ANY WARRANTY; without even the implied warranty of - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - * GNU Lesser General Public License for more details. - * - * You should have received a copy of the GNU Lesser General Public License - * along with this program. If not, see <https://www.gnu.org/licenses/>. - */ +// +/// @file ctype.hpp +/// @brief Simple implementations of character comparison functions. +// +// Alee Forth: A portable and concise Forth implementation in modern C++. +// Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com> +// +// This program is free software: you can redistribute it and/or modify +// it under the terms of the GNU Lesser General Public License as published by +// the Free Software Foundation, either version 3 of the License, or +// (at your option) any later version. +// +// This program is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +// GNU Lesser General Public License for more details. +// +// You should have received a copy of the GNU Lesser General Public License +// along with this program. If not, see <https://www.gnu.org/licenses/>. #ifndef ALEEFORTH_CTYPE_HPP #define ALEEFORTH_CTYPE_HPP -/** - * We implement our own character comparison functions to keep them lean. - */ - #include <cstdint> +/** Determines the length of a null-terminated string. */ constexpr inline unsigned strlen(const char * const s) { unsigned i = 0; while (s[i]) i++; return i; } +/** Tests if given character represents whitespace. */ constexpr inline bool isspace(uint8_t c) { return c == ' ' || c == '\t' || c == '\r' || c == '\n'; } +/** Tests if given character is a numerical digit. */ constexpr inline bool isdigit(uint8_t c) { return c >= '0' && c <= '9'; } +/** Tests if given character is an uppercase letter. */ constexpr inline bool isupper(uint8_t c) { return c >= 'A' && c <= 'Z'; } +/** Tests if given character is a lowercase letter. */ constexpr inline bool islower(uint8_t c) { return c >= 'a' && c <= 'z'; } +/** Tests if given character is a letter. */ constexpr inline bool isalpha(uint8_t c) { return isupper(c) || (c >= 'a' && c <= 'z'); } diff --git a/libalee/dictionary.cpp b/libalee/dictionary.cpp index b98b312..b1cbc5f 100644 --- a/libalee/dictionary.cpp +++ b/libalee/dictionary.cpp @@ -37,7 +37,7 @@ Addr Dictionary::allot(Cell amount) noexcept if (neww < capacity()) { write(Here, static_cast<Addr>(neww)); } else { - // TODO + // TODO how to handle allot failure? Error code? } return old; @@ -68,7 +68,7 @@ void Dictionary::addDefinition(Word word) noexcept Cell wsize = word.size(); add(wsize); - if (alignhere() - latest() >= ((1 << (sizeof(Cell) * 8 - 6)) - 1)) + if (alignhere() - latest() >= MaxDistance) add(0); auto addr = allot(wsize); @@ -91,7 +91,7 @@ Addr Dictionary::find(Word word) noexcept const Addr len = l & 0x1F; Word lw; - if ((l >> 6) < 1023) { + if ((l >> 6) < MaxDistance) { lw = Word::fromLength(lt + sizeof(Cell), len); if (equal(word, lw)) return lt; @@ -120,7 +120,7 @@ Addr Dictionary::getexec(Addr addr) noexcept const Addr len = l & 0x1Fu; addr += sizeof(Cell); - if ((l >> 6) == 1023) + if ((l >> 6) == MaxDistance) addr += sizeof(Cell); addr += len; @@ -132,7 +132,7 @@ bool Dictionary::hasInput() const noexcept { const Addr src = read(Dictionary::Source); const Addr end = read(Dictionary::SourceLen); - uint8_t idx = read(Dictionary::Input) & 0xFFu; + auto idx = static_cast<uint8_t>(read(Dictionary::Input)); while (idx < end) { auto ch = readbyte(src + idx); @@ -154,7 +154,7 @@ Word Dictionary::input() noexcept { const Addr src = read(Dictionary::Source); const Addr end = read(Dictionary::SourceLen); - uint8_t idx = read(Dictionary::Input) & 0xFFu; + auto idx = static_cast<uint8_t>(read(Dictionary::Input)); Addr wstart = src + idx; Addr wend = wstart; diff --git a/libalee/dictionary.hpp b/libalee/dictionary.hpp index 27edf68..ad1ee02 100644 --- a/libalee/dictionary.hpp +++ b/libalee/dictionary.hpp @@ -1,20 +1,22 @@ -/** - * Alee Forth: A portable and concise Forth implementation in modern C++. - * Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com> - * - * This program is free software: you can redistribute it and/or modify - * it under the terms of the GNU Lesser General Public License as published by - * the Free Software Foundation, either version 3 of the License, or - * (at your option) any later version. - * - * This program is distributed in the hope that it will be useful, - * but WITHOUT ANY WARRANTY; without even the implied warranty of - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - * GNU Lesser General Public License for more details. - * - * You should have received a copy of the GNU Lesser General Public License - * along with this program. If not, see <https://www.gnu.org/licenses/>. - */ +// +/// @file dictionary.hpp +/// @brief Defines the dictionary interface and common functionality. +// +// Alee Forth: A portable and concise Forth implementation in modern C++. +// Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com> +// +// This program is free software: you can redistribute it and/or modify +// it under the terms of the GNU Lesser General Public License as published by +// the Free Software Foundation, either version 3 of the License, or +// (at your option) any later version. +// +// This program is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +// GNU Lesser General Public License for more details. +// +// You should have received a copy of the GNU Lesser General Public License +// along with this program. If not, see <https://www.gnu.org/licenses/>. #ifndef ALEEFORTH_DICTIONARY_HPP #define ALEEFORTH_DICTIONARY_HPP @@ -28,106 +30,179 @@ #include <cstdint> /** - * Dictionary entry format: - * - 1 information byte - * bits 0..4: Length of name (L) - * bit 5: Immediate? - * bits 6..15: Distance to next entry (negative) - * - L bytes of name - * - 0+ bytes for address alignment - * - 0+ bytes of entry's data... + * @class Dictionary + * @brief Provides an interface and essential funcitonality for a dictionary. + * @details The core read and write functionality is left virtual so that + * dictionaries can be stored in any medium. So, this class cannot be used + * directly; the programmer must define a dictionary class that inherits this + * one. + * + * Dictionary entry format (for a 16-bit implementation): + * - One information cell: + * - bits 0..4: Length of name + * - bit 5: Set if word is immediate + * - bits 6..15: Distance (backwards) to the next entry + * - If bits 6..15 are all one-bits then "long" distance in following cell. + * - "Length" bytes of name + * - Zero or more bytes for address alignment + * - Zero or more bytes of the definition's contents */ - -struct Dictionary +class Dictionary { - /** - * The beginning of the dictionary is used for "internal" variables. - */ +public: + /** Stores Numerical base to use for input/output. */ constexpr static Addr Base = 0; + /** Stores the current `here` address. */ constexpr static Addr Here = sizeof(Cell); + /** Stores the address of the most recently defined word. */ constexpr static Addr Latest = sizeof(Cell) * 2; + /** Stores a boolean indication of compiling state. */ constexpr static Addr Compiling = sizeof(Cell) * 3; + /** Stores the address of the last execution token determined by colon. */ constexpr static Addr CompToken = sizeof(Cell) * 4; + /** Stores the address of the current interpreter input source. */ constexpr static Addr Source = sizeof(Cell) * 5; + /** Stores the size in bytes of the interpreter input source. */ constexpr static Addr SourceLen = sizeof(Cell) * 6; - constexpr static Addr Input = sizeof(Cell) * 7; // len data... - constexpr static Addr InputCells = 80; // bytes! + /** Stores the dictionary's input buffer (a counted string). */ + constexpr static Addr Input = sizeof(Cell) * 7; + /** Stores the size of the dictionary's input buffer in bytes. */ + constexpr static Addr InputCells = 80; + /** Stores the dictionary's "beginning" i.e. where new definitions begin. */ constexpr static Addr Begin = sizeof(Cell) * 8 + InputCells; + /** "Immediate" marker bit for a word's definition. */ constexpr static Cell Immediate = (1 << 5); + /** Maximum "short" distance between two definitions. */ + constexpr static Cell MaxDistance = (1 << (sizeof(Cell) * 8 - 6)) - 1; - /** - * Dictionary data can be stored on any read-write interface. - * You must create a dictionary class that inherits Dictionary and - * implement these functions. See `memdict.hpp` for a simple block-of- - * memory implementation. - */ + /** Returns the value of the cell at the given address. */ virtual Cell read(Addr) const noexcept = 0; + + /** Writes the given value to the cell at the given address. */ virtual void write(Addr, Cell) noexcept = 0; + + /** Returns the byte stored at the given address. */ virtual uint8_t readbyte(Addr) const noexcept = 0; + + /** Writes the given byte to the given address. */ virtual void writebyte(Addr, uint8_t) noexcept = 0; + + /** Returns the total capacity of the dictionary in bytes. */ virtual unsigned long int capacity() const noexcept = 0; /** - * Does initial dictionary setup, required before use for execution. + * Initializes essential dictionary values. + * Must be called before dictionary use. */ void initialize(); + /** + * Gets the address stored in `here`. + */ LIBALEE_SECTION Addr here() const noexcept { return read(Here); } + + /** + * Sets the address stored in `here`. + */ LIBALEE_SECTION void here(Addr l) noexcept { write(Here, l); } + /** + * Gets the value of `latest`. + */ LIBALEE_SECTION Addr latest() const noexcept { return read(Latest); } + + /** + * Sets the value of `latest`. + */ LIBALEE_SECTION void latest(Addr l) noexcept { write(Latest, l); } - // Aligns the given address. - static Addr aligned(Addr); - // Aligns `here`. + /** + * Aligns the given address to the next Cell boundary if necessary. + * @param addr The address to align. + * @return The resulting aligned address. + */ + static Addr aligned(Addr addr); + + /** + * Aligns `here` to the next Cell boundary if necessary. + * @return The new aligned address stored in `here`. + */ Addr alignhere() noexcept; - // Advances `here` by the given number of bytes. - Addr allot(Cell) noexcept; - // Stores value to `here`, then adds sizeof(Cell) to `here`. - void add(Cell) noexcept; /** - * Uses add() to store a new definition entry starting at `here`. - * The entry does not become active until a semicolon is executed. + * Allocates memory by returning and then increasing the current `here`. + * @param count The number of bytes to increase `here` by. + * @return The address stored in `here` before the increase. */ - void addDefinition(Word) noexcept; + Addr allot(Cell count) noexcept; + + /** + * Stores the given value to `here` then calls allot to "save" that cell. + * @param value The value to store. + * @see allot(Cell) + */ + void add(Cell value) noexcept; + + /** + * Stores the beginning of a new word definition in the dictionary. + * The word must eventually have its definition concluded via semicolon. + * @param word The dictionary-stored name of the new word. + */ + void addDefinition(Word word) noexcept; /** * Searches the dictionary for an entry for the given word. - * Returns zero if not found. + * @param word The dictionary-stored word to search for. + * @return The beginning address of the word or zero if not found. */ - Addr find(Word) noexcept; + Addr find(Word word) noexcept; /** - * Given the address of a dictionary entry, produces the execution token - * for that entry. + * Produces the execution token for the given dictionary entry. + * @param addr The beginning address of a defined word. + * @return The execution token for the given word. + * @see find(Word) */ - Addr getexec(Addr) noexcept; + Addr getexec(Addr addr) noexcept; /** * Reads the next word from the input buffer. - * Returns an empty word if the buffer is empty or entirely read. + * @return The next word or an empty word if one is not available. */ Word input() noexcept; + + /** + * Returns true if the dictionary's input buffer has immediately available + * data. + */ bool hasInput() const noexcept; /** - * Checks if this dictionary's word is equivalent to the given string/size. + * Checks if the dictionary-stored word is equivalent to the given string. + * @param word Dictionary-stored word to compare against. + * @param str String to compare to. + * @param size Size of the string to compare to. + * @return True if the two words are equivalent. */ - bool equal(Word, const char *, unsigned) const noexcept; + bool equal(Word word, const char *str, unsigned size) const noexcept; /** - * Checks if two words in this dictionary's word are equivalent. + * Checks if two words stored in this dictionary are equivalent. + * @param word1 First word to compare + * @param word2 Second word to compare + * @return True if the words are equivalent. */ - bool equal(Word, Word) const noexcept; + bool equal(Word word1, Word word2) const noexcept; - // Used for case-insensitive comparison between two iterators. + /** + * Generic equality comparison using our own case-insensitive comparator. + * Arguments and return value identical to std::equal. + */ template<typename Iter1, typename Iter2> LIBALEE_SECTION constexpr static bool equal(Iter1 b1, Iter1 e1, Iter2 b2) { @@ -137,7 +212,10 @@ struct Dictionary virtual ~Dictionary() {}; private: - // Case-insensitive comparison. + /** + * Case-insensitive character comparison used for dictionary lookup. + * @return True if the characters are equivalent. + */ LIBALEE_SECTION constexpr static bool eqchars(char c1, char c2) { if (isalpha(static_cast<uint8_t>(c1))) diff --git a/libalee/parser.cpp b/libalee/parser.cpp index b3e8211..11aba38 100644 --- a/libalee/parser.cpp +++ b/libalee/parser.cpp @@ -25,14 +25,17 @@ Error Parser::parse(State& state, const char *str) { auto addr = Dictionary::Input; + // Set source and input length const auto len = static_cast<Cell>(strlen(str)); state.dict.write(addr, 0); state.dict.write(Dictionary::SourceLen, len); + // Fill input buffer with string contents addr += sizeof(Cell); while (*str) state.dict.writebyte(addr++, *str++); + // Zero the remaining input buffer while (addr < Dictionary::Input + Dictionary::InputCells) state.dict.writebyte(addr++, '\0'); @@ -54,8 +57,10 @@ LIBALEE_SECTION Error Parser::parseWord(State& state, Word word) { bool imm; - Addr ins = state.dict.find(word); + Addr ins; + // Search order: dictionary, core word-set, number, custom parse. + ins = state.dict.find(word); if (ins == 0) { auto cw = CoreWords::findi(state, word); @@ -67,7 +72,7 @@ Error Parser::parseWord(State& state, Word word) return r; } else { ins = cw; - imm = ins == CoreWords::Semicolon; + imm = ins == CoreWords::token(";"); } } else { imm = state.dict.read(ins) & Dictionary::Immediate; @@ -119,8 +124,11 @@ LIBALEE_SECTION void Parser::processLiteral(State& state, Cell value) { if (state.compiling()) { - constexpr auto ins = CoreWords::findi("_lit"); + constexpr auto ins = CoreWords::token("_lit"); + // Literal compression: opcodes between WordCount and Begin are unused, + // so we assign literals to them to save space. Opcode "WordCount" + // pushes zero to the stack, "WordCount + 1" pushes a one, etc. const Cell maxlit = Dictionary::Begin - CoreWords::WordCount; if (value >= 0 && value < maxlit) value += CoreWords::WordCount; diff --git a/libalee/parser.hpp b/libalee/parser.hpp index 6b50918..7eca656 100644 --- a/libalee/parser.hpp +++ b/libalee/parser.hpp @@ -1,20 +1,22 @@ -/** - * Alee Forth: A portable and concise Forth implementation in modern C++. - * Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com> - * - * This program is free software: you can redistribute it and/or modify - * it under the terms of the GNU Lesser General Public License as published by - * the Free Software Foundation, either version 3 of the License, or - * (at your option) any later version. - * - * This program is distributed in the hope that it will be useful, - * but WITHOUT ANY WARRANTY; without even the implied warranty of - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - * GNU Lesser General Public License for more details. - * - * You should have received a copy of the GNU Lesser General Public License - * along with this program. If not, see <https://www.gnu.org/licenses/>. - */ +// +/// @file parser.hpp +/// @brief Provides functions to parse text for interpretation/execution. +// +// Alee Forth: A portable and concise Forth implementation in modern C++. +// Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com> +// +// This program is free software: you can redistribute it and/or modify +// it under the terms of the GNU Lesser General Public License as published by +// the Free Software Foundation, either version 3 of the License, or +// (at your option) any later version. +// +// This program is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +// GNU Lesser General Public License for more details. +// +// You should have received a copy of the GNU Lesser General Public License +// along with this program. If not, see <https://www.gnu.org/licenses/>. #ifndef ALEEFORTH_PARSER_HPP #define ALEEFORTH_PARSER_HPP @@ -25,37 +27,60 @@ #include <string_view> +/** + * @class Parser + * @brief Provides routines for parsing Forth code. + */ class Parser { public: + /** + * Pointer to a user-provided function that + */ static Error (*customParse)(State&, Word); /** - * Parses (and evaluates) the given string using the given state. - * The string is stored in the state's input buffer, then parseSource() - * works through that using parseWord(). parseWord() will compile or - * execute as necessary. + * Parses and evaluates the given string using the given state. + * The string is stored in the state's input buffer before parseSource() + * is called. + * @param state The state to parse and evaluate with. + * @param str The string to parse. + * @return Error token to indicate if parsing was successful. + * @see parseSource(State&) */ - static Error parse(State&, const char *); + static Error parse(State& state, const char *str); /** - * Parses (and evaluates) through the words stored in the state's input - * buffer. + * Parses through and compiles or evaluates the words stored in the state's + * input source. + * @param state The state to parse with. + * @return Error token to indicate if parsing was successful. + * @see parseWord(State&, Word) */ - static Error parseSource(State&); + static Error parseSource(State& state); - static void processLiteral(State&, Cell); + /** + * Parses the given value and either pushes it to the stack or compiles + * that functionality. + * @param state The state to give the value to. + * @param value The value to process. + */ + static void processLiteral(State& state, Cell value); private: /** * Parses the given word using the given state. + * @return Error token to indicate if parsing was successful. */ static Error parseWord(State&, Word); /** * Attempts to parse the given word into a number. + * @param state The state object with the dictionary containing the word. + * @param word The dictionary-stored word (number) to parse. + * @return Error token to indicate if parsing was successful. */ - static Error parseNumber(State&, Word); + static Error parseNumber(State& state, Word word); }; #endif // ALEEFORTH_PARSER_HPP diff --git a/libalee/state.hpp b/libalee/state.hpp index 0ac9a7c..a5e49b5 100644 --- a/libalee/state.hpp +++ b/libalee/state.hpp @@ -1,20 +1,22 @@ -/** - * Alee Forth: A portable and concise Forth implementation in modern C++. - * Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com> - * - * This program is free software: you can redistribute it and/or modify - * it under the terms of the GNU Lesser General Public License as published by - * the Free Software Foundation, either version 3 of the License, or - * (at your option) any later version. - * - * This program is distributed in the hope that it will be useful, - * but WITHOUT ANY WARRANTY; without even the implied warranty of - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - * GNU Lesser General Public License for more details. - * - * You should have received a copy of the GNU Lesser General Public License - * along with this program. If not, see <https://www.gnu.org/licenses/>. - */ +// +/// @file state.hpp +/// @brief Provides object to manage execution and interpretation state. +// +// Alee Forth: A portable and concise Forth implementation in modern C++. +// Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com> +// +// This program is free software: you can redistribute it and/or modify +// it under the terms of the GNU Lesser General Public License as published by +// the Free Software Foundation, either version 3 of the License, or +// (at your option) any later version. +// +// This program is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +// GNU Lesser General Public License for more details. +// +// You should have received a copy of the GNU Lesser General Public License +// along with this program. If not, see <https://www.gnu.org/licenses/>. #ifndef ALEEFORTH_STATE_HPP #define ALEEFORTH_STATE_HPP @@ -26,31 +28,53 @@ #include <csetjmp> #include <cstddef> +/** + * Size of the primary data stack, number of cells. + */ constexpr unsigned DataStackSize = 64; + +/** + * Size of the return stack, number of cells. + */ constexpr unsigned ReturnStackSize = 64; +/** + * @class State + * Object to track execution state. + */ class State { + /** Input functions should add input to the input buffer when available. */ using InputFunc = void (*)(State&); + /** Context object that defines a state of execution. */ struct Context { - Addr ip = 0; - std::jmp_buf jmpbuf = {}; + Addr ip = 0; /** Instruction pointer */ + std::jmp_buf jmpbuf = {}; /** setjmp() buffer for exiting execute() */ }; public: + /** Reference to dictionary used by this state. */ Dictionary& dict; + /** + * Constructs a state object that uses the given dictionary and input + * function. + * @param d The dictionary to be used by this state + * @param i The input collection function to be used by this state + */ constexpr State(Dictionary& d, InputFunc i): dict(d), inputfunc(i), context() {} /** - * Begins execution at the given execution token. + * Begins execution starting from the given execution token. * If the token is a CoreWord, this function exits after its execution. * Otherwise, execution continues until the word's execution completes. * Encountering an error will cause this function to exit immediately. + * @param addr The token to be executed + * @return An error token to indicate if execution was successful */ - Error execute(Addr); + Error execute(Addr addr); /** * Clears the data and return stacks, sets ip to zero, and clears the @@ -58,25 +82,30 @@ public: */ void reset(); + /** Returns a reference to the instruction pointer. */ LIBALEE_SECTION Addr& ip() noexcept { return context.ip; } + /** Calls the user input function with this state as the argument. */ LIBALEE_SECTION void input() noexcept { inputfunc(*this); } + /** Returns true if currently in a compiling state. */ bool compiling() const; + /** Sets the compiling state. True if compiling, false if interpreting. */ void compiling(bool); + /** Returns the number of values stored on the data stack. */ std::size_t size() const noexcept; + /** Returns the number of values stored on the return stack. */ std::size_t rsize() const noexcept; /** - * Saves execution state so that a new execution can begin. - * Used for EVALUATE. + * Returns the current execution state. Usually followed by a load() call. */ Context save(); @@ -85,49 +114,77 @@ public: */ void load(const Context&); + /** + * Pushes the given value to the data stack. + */ LIBALEE_SECTION inline void push(Cell value) { verify(dsp < dstack + DataStackSize, Error::push); *dsp++ = value; } + /** + * Pops a value from the data stack and returns that value. + */ LIBALEE_SECTION inline Cell pop() { verify(dsp > dstack, Error::pop); return *--dsp; } + /** + * Pushes the given value to the return stack. + */ LIBALEE_SECTION inline void pushr(Cell value) { verify(rsp < rstack + ReturnStackSize, Error::pushr); *rsp++ = value; } + /** + * Pops a value from the return stack and returns that value. + */ LIBALEE_SECTION inline Cell popr() { verify(rsp > rstack, Error::popr); return *--rsp; } + /** + * Returns the value stored at the current data stack position. + */ LIBALEE_SECTION inline Cell& top() { verify(dsp > dstack, Error::top); return *(dsp - 1); } + /** + * Picks a value currently stored on the data stack. + * @param i Index from current position to fetch from + * @return The value stored at the given index + */ LIBALEE_SECTION inline Cell& pick(std::size_t i) { verify(dsp - i > dstack, Error::pick); return *(dsp - i - 1); } - // Advances the instruction pointer and returns that cell's contents. + /** + * Advances the instruction pointer and returns that cell's contents. + */ LIBALEE_SECTION inline Cell beyondip() { context.ip += sizeof(Cell); return dict.read(context.ip); } + /** + * Asserts the given condition is true, longjmp-ing if false. + * Used as an exception handler and the method of exiting execution. + * @param condition Condition to be tested + * @param error Error code to report via longjmp() on false condition + */ LIBALEE_SECTION inline void verify(bool condition, Error error) { if (!condition) @@ -135,13 +192,13 @@ public: } private: - InputFunc inputfunc; // User-provided function to collect "stdin" input. - Context context; + InputFunc inputfunc; /** User-provided function to collect user input. */ + Context context; /** State's current execution context. */ - Cell dstack[DataStackSize] = {}; - Cell rstack[ReturnStackSize] = {}; - Cell *dsp = dstack; - Cell *rsp = rstack; + Cell dstack[DataStackSize] = {}; /** Data stack */ + Cell rstack[ReturnStackSize] = {}; /** Return stack */ + Cell *dsp = dstack; /** Current data stack position */ + Cell *rsp = rstack; /** Current return stack position */ }; #endif // ALEEFORTH_STATE_HPP diff --git a/libalee/types.hpp b/libalee/types.hpp index 028c490..7b5bb62 100644 --- a/libalee/types.hpp +++ b/libalee/types.hpp @@ -1,20 +1,22 @@ -/** - * Alee Forth: A portable and concise Forth implementation in modern C++. - * Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com> - * - * This program is free software: you can redistribute it and/or modify - * it under the terms of the GNU Lesser General Public License as published by - * the Free Software Foundation, either version 3 of the License, or - * (at your option) any later version. - * - * This program is distributed in the hope that it will be useful, - * but WITHOUT ANY WARRANTY; without even the implied warranty of - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - * GNU Lesser General Public License for more details. - * - * You should have received a copy of the GNU Lesser General Public License - * along with this program. If not, see <https://www.gnu.org/licenses/>. - */ +// +/// @file types.hpp +/// @brief Defines common types used throughout Alee Forth. +// +// Alee Forth: A portable and concise Forth implementation in modern C++. +// Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com> +// +// This program is free software: you can redistribute it and/or modify +// it under the terms of the GNU Lesser General Public License as published by +// the Free Software Foundation, either version 3 of the License, or +// (at your option) any later version. +// +// This program is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +// GNU Lesser General Public License for more details. +// +// You should have received a copy of the GNU Lesser General Public License +// along with this program. If not, see <https://www.gnu.org/licenses/>. #ifndef ALEEFORTH_TYPES_HPP #define ALEEFORTH_TYPES_HPP @@ -22,55 +24,86 @@ #include <cstdint> #include <iterator> -/** - * Configure the below types for your platform. - */ +/** Dictionary address type. Must be equivalent to "unsigned Cell". */ using Addr = uint16_t; +/** Data cell type. Dictionary is basically an array of this type. */ using Cell = int16_t; +/** Double-width cell type. Must be twice the size of Cell. */ using DoubleCell = int32_t; -using DoubleAddr = uint32_t; // Only used for um/mod. +/** Double-width addr type. Must be twice the size of Addr. Used by um/mod. */ +using DoubleAddr = uint32_t; struct Dictionary; struct State; -using Func = void (*)(State&); - +/** + * Error enum to report success or failure of parsing or execution. + */ enum class Error : int { - none = 0, - push, - pop, - pushr, - popr, - top, - pick, - exit, - noword + none = 0, /** No error */ + push, /** Could not push (data stack overflow) */ + pop, /** Could not pop (data stack underflow) */ + pushr, /** Could not push (return stack overflow) */ + popr, /** Could not pop (return stack underflow) */ + top, /** Could not fetch data stack top (data stack underflow) */ + pick, /** Could not pick data stack value (data stack underflow) */ + exit, /** No error, exited from State::execute() */ + noword /** Parsing failed because the word was not found */ }; /** - * Stores the start and past-the-end addresses of a dictionary's word. + * @class Word + * Stores the beginning and end indices of a dictionary-defined word. */ class Word { + /** Beginning (inclusive) index */ Addr start; + /** End (exclusive) index */ Addr wend; public: struct iterator; + /** + * Constructs a word with the given start and end indices. + * @param s Start/beginning index + * @param e (past-the-)end index + */ constexpr explicit Word(Addr s = 0, Addr e = 0): start(s), wend(e) {} + /** + * Constructs a word using beginning index and length. + * @param s Beginning/start index of word + * @param l Count of bytes until end of word + * @return Resulting Word object + */ LIBALEE_SECTION static constexpr Word fromLength(Addr s, Addr l) { return Word(s, s + l); } + /** Returns the size of this word in bytes. */ Addr size() const noexcept; - iterator begin(const Dictionary *); - iterator end(const Dictionary *); - + /** + * Creates a beginning iterator for the word. + * @param dict Pointer to dictionary object containing this word + * @return Iterator pointing to this word's beginning + */ + iterator begin(const Dictionary *dict); + + /** + * Creates an end iterator for the word. + * @param dict Pointer to dictionary object containing this word + * @return Iterator pointing to past-the-end of this word + */ + iterator end(const Dictionary *dict); + + /** + * Forward-iterator for iterating through the letters of this word. + */ struct iterator { using iterator_category = std::input_iterator_tag; using value_type = uint8_t; @@ -78,15 +111,26 @@ public: using reference = void; using difference_type = Cell; + /** Iterator's current address within its containing dictionary. */ Addr addr; + /** Pointer to dictionary that contains this word. */ const Dictionary *dict; + /** + * Constructs a word iterator. + * @param a The address the iterator points to + * @param d The dictionary that contains this word + */ constexpr iterator(Addr a, const Dictionary *d): addr(a), dict(d) {} + /** Prefix increment */ iterator& operator++(); + /** Postfix increment */ iterator operator++(int); + /** Returns value pointed to by iterator */ value_type operator*(); + /** Iterator comparison function (case-insensitive) */ bool operator!=(const iterator&); }; }; |