aboutsummaryrefslogtreecommitdiffstats
path: root/libalee
diff options
context:
space:
mode:
authorClyne Sullivan <clyne@bitgloo.com>2023-11-13 22:04:32 -0500
committerClyne Sullivan <clyne@bitgloo.com>2023-11-13 22:04:32 -0500
commitebbde43fa98315a57a15650944f80757f9652b9b (patch)
tree71fb83ce0d0e7f1b03959f2ddb0663bc2e142578 /libalee
parent23d746d646adb6b11fa7758a2490ff955c8a9b91 (diff)
parent0810456e9c5c19a47511a682eeabc71008632a2c (diff)
Merge branch 'documentation'
Diffstat (limited to 'libalee')
-rw-r--r--libalee/corewords.cpp152
-rw-r--r--libalee/corewords.hpp90
-rw-r--r--libalee/ctype.hpp46
-rw-r--r--libalee/dictionary.cpp12
-rw-r--r--libalee/dictionary.hpp200
-rw-r--r--libalee/parser.cpp14
-rw-r--r--libalee/parser.hpp79
-rw-r--r--libalee/state.hpp117
-rw-r--r--libalee/types.hpp116
9 files changed, 543 insertions, 283 deletions
diff --git a/libalee/corewords.cpp b/libalee/corewords.cpp
index b768163..7c79aea 100644
--- a/libalee/corewords.cpp
+++ b/libalee/corewords.cpp
@@ -20,22 +20,9 @@
#include <utility>
-LIBALEE_SECTION
-void find(State& state, Word word)
-{
- Cell tok = 0;
- Cell imm = 0;
-
- if (auto j = state.dict.find(word); j > 0) {
- tok = state.dict.getexec(j);
- imm = (state.dict.read(j) & Dictionary::Immediate) ? 1 : -1;
- } else if (tok = CoreWords::findi(state, word); tok >= 0) {
- imm = (tok == CoreWords::Semicolon) ? 1 : -1;
- }
-
- state.push(tok);
- state.push(imm);
-}
+static void find(State&, Word);
+static DoubleCell popd(State&);
+static void pushd(State&, DoubleCell);
LIBALEE_SECTION
void CoreWords::run(Cell ins, State& state)
@@ -44,21 +31,8 @@ void CoreWords::run(Cell ins, State& state)
DoubleCell dcell;
Addr index = ins;
-
auto& ip = state.ip();
- auto popd = [](State& s) {
- DoubleCell dcell = s.pop();
- dcell <<= sizeof(Cell) * 8;
- dcell |= static_cast<Addr>(s.pop());
- return dcell;
- };
-
- auto pushd = [](State& s, DoubleCell d) {
- s.push(static_cast<Cell>(d));
- s.push(static_cast<Cell>(d >> (sizeof(Cell) * 8)));
- };
-
execute:
if (index >= Dictionary::Begin) {
// must be calling a defined subroutine
@@ -66,95 +40,95 @@ execute:
ip = index;
return;
} else switch (index) {
- case 0: // _lit
+ case token("_lit"): // Execution semantics of `literal`.
state.push(state.beyondip());
break;
- case 1: // drop
+ case token("drop"):
state.pop();
break;
- case 2: // dup
+ case token("dup"):
state.push(state.top());
break;
- case 3: // swap
+ case token("swap"):
std::swap(state.top(), state.pick(1));
break;
- case 4: // pick
+ case token("pick"):
state.push(state.pick(state.pop()));
break;
- case 5: // sys
+ case token("sys"): // Calls user-defined "system" handler.
user_sys(state);
break;
- case 6: // add
+ case token("+"):
cell = state.pop();
state.top() += cell;
break;
- case 7: // sub
+ case token("-"):
cell = state.pop();
state.top() -= cell;
break;
- case 8: // mul ( n n -- d )
+ case token("m*"): // ( n n -- d )
cell = state.pop();
dcell = state.pop() * cell;
pushd(state, dcell);
break;
- case 9: // div ( d n -- n )
+ case token("_/"): // ( d n -- n )
cell = state.pop();
dcell = popd(state);
state.push(static_cast<Cell>(dcell / cell));
break;
- case 10: // mod ( d n -- n )
+ case token("_%"): // ( d n -- n )
cell = state.pop();
dcell = popd(state);
state.push(static_cast<Cell>(dcell % cell));
break;
- case 11: // peek
+ case token("_@"): // ( addr cell? -- n )
if (state.pop())
state.push(state.dict.read(state.pop()));
else
state.push(state.dict.readbyte(state.pop()));
break;
- case 12: // poke
+ case token("_!"): // ( n addr cell? -- )
cell = state.pop();
if (auto addr = state.pop(); cell)
state.dict.write(addr, state.pop());
else
state.dict.writebyte(addr, state.pop() & 0xFFu);
break;
- case 13: // pushr
+ case token(">r"):
state.pushr(state.pop());
break;
- case 14: // popr
+ case token("r>"):
state.push(state.popr());
break;
- case 15: // equal
+ case token("="):
cell = state.pop();
state.top() = state.top() == cell ? -1 : 0;
break;
- case 16: // lt
+ case token("<"):
cell = state.pop();
state.top() = state.top() < cell ? -1 : 0;
break;
- case 17: // and
+ case token("&"):
cell = state.pop();
state.top() &= cell;
break;
- case 18: // or
+ case token("|"):
cell = state.pop();
state.top() |= cell;
break;
- case 19: // xor
+ case token("^"):
cell = state.pop();
state.top() ^= cell;
break;
- case 20: // shl
+ case token("<<"):
cell = state.pop();
reinterpret_cast<Addr&>(state.top()) <<= static_cast<Addr>(cell);
break;
- case 21: // shr
+ case token(">>"):
cell = state.pop();
reinterpret_cast<Addr&>(state.top()) >>= static_cast<Addr>(cell);
break;
- case 22: // colon
+ case token(":"): // Begins definition/compilation of new word.
state.push(state.dict.alignhere());
state.dict.write(Dictionary::CompToken, state.top());
while (!state.dict.hasInput())
@@ -162,50 +136,53 @@ execute:
state.dict.addDefinition(state.dict.input());
state.compiling(true);
break;
- case 23: // tick
+ case token("_'"): // Collects input word and finds execution token.
while (!state.dict.hasInput())
state.input();
find(state, state.dict.input());
break;
- case 24: // execute
+ case token("execute"):
index = state.pop();
goto execute;
- case 25: // exit
+ case token("exit"):
ip = state.popr();
state.verify(ip != 0, Error::exit);
break;
- case 26: // semic
- state.dict.add(findi("exit"));
+ case token(";"): // Concludes word definition.
+ state.dict.add(token("exit"));
state.compiling(false);
cell = state.pop();
dcell = cell - state.dict.latest();
- if (dcell > (1 << (sizeof(Cell) * 8 - 6)) - 1) {
- state.dict.write(static_cast<Addr>(cell) + sizeof(Cell), static_cast<Cell>(dcell));
- dcell = ((1 << (sizeof(Cell) * 8 - 6)) - 1);
+ if (dcell >= Dictionary::MaxDistance) {
+ // Large distance to previous entry: store in dedicated cell.
+ state.dict.write(static_cast<Addr>(cell) + sizeof(Cell),
+ static_cast<Cell>(dcell));
+ dcell = Dictionary::MaxDistance;
}
- state.dict.write(cell, (state.dict.read(cell) & 0x1F) | static_cast<Cell>(dcell << 6));
+ state.dict.write(cell,
+ (state.dict.read(cell) & 0x1F) | static_cast<Cell>(dcell << 6));
state.dict.latest(cell);
break;
- case 27: // _jmp0
+ case token("_jmp0"): // Jump if popped value equals zero.
if (state.pop()) {
state.beyondip();
break;
}
[[fallthrough]];
- case 28: // _jmp
+ case token("_jmp"): // Unconditional jump.
ip = state.beyondip();
return;
- case 29: // depth
+ case token("depth"):
state.push(static_cast<Cell>(state.size()));
break;
- case 30: // _rdepth
+ case token("_rdepth"):
state.push(static_cast<Cell>(state.rsize()));
break;
- case 31: // _in
+ case token("_in"): // Fetches more input from the user input source.
state.input();
break;
- case 32: // _ex
+ case token("_ev"): // Evaluates words from current input source.
{
const auto st = state.save();
ip = 0;
@@ -213,13 +190,13 @@ execute:
state.load(st);
}
break;
- case 33: // find
+ case token("find"):
cell = state.pop();
find(state,
Word::fromLength(static_cast<Addr>(cell + 1),
state.dict.readbyte(cell)));
break;
- case 34: // _uma
+ case token("_uma"): // ( d u u -- d ): Unsigned multiply-add.
{
const auto plus = state.pop();
cell = state.pop();
@@ -229,12 +206,12 @@ execute:
pushd(state, dcell);
}
break;
- case 35: // u<
+ case token("u<"):
cell = state.pop();
state.top() = static_cast<Addr>(state.top()) <
static_cast<Addr>(cell) ? -1 : 0;
break;
- case 36: // um/mod
+ case token("um/mod"):
cell = state.pop();
dcell = popd(state);
@@ -245,7 +222,7 @@ execute:
static_cast<DoubleAddr>(dcell) /
static_cast<Addr>(cell)));
break;
- default:
+ default: // Compacted literals (WordCount <= ins < Begin).
state.push(ins - WordCount);
break;
}
@@ -259,3 +236,34 @@ Cell CoreWords::findi(State& state, Word word)
return findi(word.begin(&state.dict), word.size());
}
+LIBALEE_SECTION
+void find(State& state, Word word)
+{
+ Cell tok = 0;
+ Cell imm = 0;
+
+ if (auto j = state.dict.find(word); j > 0) {
+ tok = state.dict.getexec(j);
+ imm = (state.dict.read(j) & Dictionary::Immediate) ? 1 : -1;
+ } else if (tok = CoreWords::findi(state, word); tok >= 0) {
+ imm = (tok == CoreWords::token(";")) ? 1 : -1;
+ }
+
+ state.push(tok);
+ state.push(imm);
+}
+
+DoubleCell popd(State& s)
+{
+ DoubleCell dcell = s.pop();
+ dcell <<= sizeof(Cell) * 8;
+ dcell |= static_cast<Addr>(s.pop());
+ return dcell;
+}
+
+void pushd(State& s, DoubleCell d)
+{
+ s.push(static_cast<Cell>(d));
+ s.push(static_cast<Cell>(d >> (sizeof(Cell) * 8)));
+}
+
diff --git a/libalee/corewords.hpp b/libalee/corewords.hpp
index f4ab851..30d0a42 100644
--- a/libalee/corewords.hpp
+++ b/libalee/corewords.hpp
@@ -1,54 +1,78 @@
-/**
- * Alee Forth: A portable and concise Forth implementation in modern C++.
- * Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com>
- *
- * This program is free software: you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation, either version 3 of the License, or
- * (at your option) any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public License
- * along with this program. If not, see <https://www.gnu.org/licenses/>.
- */
+//
+/// @file corewords.hpp
+/// @brief Manages the fundamental word-set and its execution.
+//
+// Alee Forth: A portable and concise Forth implementation in modern C++.
+// Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com>
+//
+// This program is free software: you can redistribute it and/or modify
+// it under the terms of the GNU Lesser General Public License as published by
+// the Free Software Foundation, either version 3 of the License, or
+// (at your option) any later version.
+//
+// This program is distributed in the hope that it will be useful,
+// but WITHOUT ANY WARRANTY; without even the implied warranty of
+// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+// GNU Lesser General Public License for more details.
+//
+// You should have received a copy of the GNU Lesser General Public License
+// along with this program. If not, see <https://www.gnu.org/licenses/>.
#ifndef ALEEFORTH_COREWORDS_HPP
#define ALEEFORTH_COREWORDS_HPP
#include "config.hpp"
-#include "types.hpp"
#include "dictionary.hpp"
+#include "types.hpp"
+
+#include <algorithm>
+
+class State;
/**
* To be implemented by the user, this function is called when the `sys` word
* is executed.
+ * @param state Current execution state object.
*/
-void user_sys(State&);
+void user_sys(State& state);
+/**
+ * @class CoreWords
+ * @brief Provides the fundamental word-set and manages its execution.
+ */
class CoreWords
{
public:
- constexpr static Cell WordCount = 37;
- constexpr static Cell Semicolon = 26;
+ /**
+ * Searches for the token/index of the given word if it is part of the
+ * fundamental word-set.
+ * @param state Current execution state object.
+ * @param word Word (stored in state's dictionary memory) to look up.
+ * @return The token/index of the word or -1 if not found.
+ */
+ static Cell findi(State& state, Word word);
/**
- * Finds execution token that corresponds to the given word.
- * Returns -1 if not found.
+ * Looks up the token/index of the given fundamental word.
+ * Primarily used for compile-time lookup.
+ * @param word The word to look up.
+ * @return The token/index of the word or -1 if not found.
*/
- static Cell findi(State&, Word);
- consteval static Cell findi(const char *word) {
+ consteval static Cell token(const char *word) {
return findi(word, strlen(word));
}
/**
- * Executes the given CoreWord execution token using the given state.
+ * Executes the given execution token using the given state.
+ * @param token Any valid execution token (word, fundamental, constant...).
+ * @param state The state object to execute with.
*/
- static void run(Cell, State&);
+ static void run(Cell token, State& state);
+ /**
+ * String lookup table for the fundamental word-set.
+ * This also determines the opcode (index) of these words.
+ */
constexpr static char wordsarr[] =
"_lit\0drop\0dup\0swap\0pick\0sys\0"
"+\0-\0m*\0_/\0_%\0"
@@ -59,7 +83,19 @@ public:
"depth\0_rdepth\0_in\0_ev\0find\0"
"_uma\0u<\0um/mod\0";
+ /**
+ * Count of total fundamental words.
+ */
+ constexpr static Cell WordCount = [] {
+ return std::count(wordsarr, wordsarr + sizeof(wordsarr), '\0'); }();
+
private:
+ /**
+ * Generic implementation of findi(). Private; use public implementations.
+ * @param it Beginning iterator of the word to search for.
+ * @param size Size of the searched-for word i.e. end == it + size.
+ * @return The token/index of the word or -1 if not found.
+ */
template<typename Iter>
LIBALEE_SECTION
constexpr static Cell findi(Iter it, std::size_t size)
diff --git a/libalee/ctype.hpp b/libalee/ctype.hpp
index b0df174..f7ce3fb 100644
--- a/libalee/ctype.hpp
+++ b/libalee/ctype.hpp
@@ -1,52 +1,56 @@
-/**
- * Alee Forth: A portable and concise Forth implementation in modern C++.
- * Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com>
- *
- * This program is free software: you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation, either version 3 of the License, or
- * (at your option) any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public License
- * along with this program. If not, see <https://www.gnu.org/licenses/>.
- */
+//
+/// @file ctype.hpp
+/// @brief Simple implementations of character comparison functions.
+//
+// Alee Forth: A portable and concise Forth implementation in modern C++.
+// Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com>
+//
+// This program is free software: you can redistribute it and/or modify
+// it under the terms of the GNU Lesser General Public License as published by
+// the Free Software Foundation, either version 3 of the License, or
+// (at your option) any later version.
+//
+// This program is distributed in the hope that it will be useful,
+// but WITHOUT ANY WARRANTY; without even the implied warranty of
+// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+// GNU Lesser General Public License for more details.
+//
+// You should have received a copy of the GNU Lesser General Public License
+// along with this program. If not, see <https://www.gnu.org/licenses/>.
#ifndef ALEEFORTH_CTYPE_HPP
#define ALEEFORTH_CTYPE_HPP
-/**
- * We implement our own character comparison functions to keep them lean.
- */
-
#include <cstdint>
+/** Determines the length of a null-terminated string. */
constexpr inline unsigned strlen(const char * const s) {
unsigned i = 0;
while (s[i]) i++;
return i;
}
+/** Tests if given character represents whitespace. */
constexpr inline bool isspace(uint8_t c) {
return c == ' ' || c == '\t' || c == '\r' || c == '\n';
}
+/** Tests if given character is a numerical digit. */
constexpr inline bool isdigit(uint8_t c) {
return c >= '0' && c <= '9';
}
+/** Tests if given character is an uppercase letter. */
constexpr inline bool isupper(uint8_t c) {
return c >= 'A' && c <= 'Z';
}
+/** Tests if given character is a lowercase letter. */
constexpr inline bool islower(uint8_t c) {
return c >= 'a' && c <= 'z';
}
+/** Tests if given character is a letter. */
constexpr inline bool isalpha(uint8_t c) {
return isupper(c) || (c >= 'a' && c <= 'z');
}
diff --git a/libalee/dictionary.cpp b/libalee/dictionary.cpp
index b98b312..b1cbc5f 100644
--- a/libalee/dictionary.cpp
+++ b/libalee/dictionary.cpp
@@ -37,7 +37,7 @@ Addr Dictionary::allot(Cell amount) noexcept
if (neww < capacity()) {
write(Here, static_cast<Addr>(neww));
} else {
- // TODO
+ // TODO how to handle allot failure? Error code?
}
return old;
@@ -68,7 +68,7 @@ void Dictionary::addDefinition(Word word) noexcept
Cell wsize = word.size();
add(wsize);
- if (alignhere() - latest() >= ((1 << (sizeof(Cell) * 8 - 6)) - 1))
+ if (alignhere() - latest() >= MaxDistance)
add(0);
auto addr = allot(wsize);
@@ -91,7 +91,7 @@ Addr Dictionary::find(Word word) noexcept
const Addr len = l & 0x1F;
Word lw;
- if ((l >> 6) < 1023) {
+ if ((l >> 6) < MaxDistance) {
lw = Word::fromLength(lt + sizeof(Cell), len);
if (equal(word, lw))
return lt;
@@ -120,7 +120,7 @@ Addr Dictionary::getexec(Addr addr) noexcept
const Addr len = l & 0x1Fu;
addr += sizeof(Cell);
- if ((l >> 6) == 1023)
+ if ((l >> 6) == MaxDistance)
addr += sizeof(Cell);
addr += len;
@@ -132,7 +132,7 @@ bool Dictionary::hasInput() const noexcept
{
const Addr src = read(Dictionary::Source);
const Addr end = read(Dictionary::SourceLen);
- uint8_t idx = read(Dictionary::Input) & 0xFFu;
+ auto idx = static_cast<uint8_t>(read(Dictionary::Input));
while (idx < end) {
auto ch = readbyte(src + idx);
@@ -154,7 +154,7 @@ Word Dictionary::input() noexcept
{
const Addr src = read(Dictionary::Source);
const Addr end = read(Dictionary::SourceLen);
- uint8_t idx = read(Dictionary::Input) & 0xFFu;
+ auto idx = static_cast<uint8_t>(read(Dictionary::Input));
Addr wstart = src + idx;
Addr wend = wstart;
diff --git a/libalee/dictionary.hpp b/libalee/dictionary.hpp
index 27edf68..ad1ee02 100644
--- a/libalee/dictionary.hpp
+++ b/libalee/dictionary.hpp
@@ -1,20 +1,22 @@
-/**
- * Alee Forth: A portable and concise Forth implementation in modern C++.
- * Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com>
- *
- * This program is free software: you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation, either version 3 of the License, or
- * (at your option) any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public License
- * along with this program. If not, see <https://www.gnu.org/licenses/>.
- */
+//
+/// @file dictionary.hpp
+/// @brief Defines the dictionary interface and common functionality.
+//
+// Alee Forth: A portable and concise Forth implementation in modern C++.
+// Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com>
+//
+// This program is free software: you can redistribute it and/or modify
+// it under the terms of the GNU Lesser General Public License as published by
+// the Free Software Foundation, either version 3 of the License, or
+// (at your option) any later version.
+//
+// This program is distributed in the hope that it will be useful,
+// but WITHOUT ANY WARRANTY; without even the implied warranty of
+// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+// GNU Lesser General Public License for more details.
+//
+// You should have received a copy of the GNU Lesser General Public License
+// along with this program. If not, see <https://www.gnu.org/licenses/>.
#ifndef ALEEFORTH_DICTIONARY_HPP
#define ALEEFORTH_DICTIONARY_HPP
@@ -28,106 +30,179 @@
#include <cstdint>
/**
- * Dictionary entry format:
- * - 1 information byte
- * bits 0..4: Length of name (L)
- * bit 5: Immediate?
- * bits 6..15: Distance to next entry (negative)
- * - L bytes of name
- * - 0+ bytes for address alignment
- * - 0+ bytes of entry's data...
+ * @class Dictionary
+ * @brief Provides an interface and essential funcitonality for a dictionary.
+ * @details The core read and write functionality is left virtual so that
+ * dictionaries can be stored in any medium. So, this class cannot be used
+ * directly; the programmer must define a dictionary class that inherits this
+ * one.
+ *
+ * Dictionary entry format (for a 16-bit implementation):
+ * - One information cell:
+ * - bits 0..4: Length of name
+ * - bit 5: Set if word is immediate
+ * - bits 6..15: Distance (backwards) to the next entry
+ * - If bits 6..15 are all one-bits then "long" distance in following cell.
+ * - "Length" bytes of name
+ * - Zero or more bytes for address alignment
+ * - Zero or more bytes of the definition's contents
*/
-
-struct Dictionary
+class Dictionary
{
- /**
- * The beginning of the dictionary is used for "internal" variables.
- */
+public:
+ /** Stores Numerical base to use for input/output. */
constexpr static Addr Base = 0;
+ /** Stores the current `here` address. */
constexpr static Addr Here = sizeof(Cell);
+ /** Stores the address of the most recently defined word. */
constexpr static Addr Latest = sizeof(Cell) * 2;
+ /** Stores a boolean indication of compiling state. */
constexpr static Addr Compiling = sizeof(Cell) * 3;
+ /** Stores the address of the last execution token determined by colon. */
constexpr static Addr CompToken = sizeof(Cell) * 4;
+ /** Stores the address of the current interpreter input source. */
constexpr static Addr Source = sizeof(Cell) * 5;
+ /** Stores the size in bytes of the interpreter input source. */
constexpr static Addr SourceLen = sizeof(Cell) * 6;
- constexpr static Addr Input = sizeof(Cell) * 7; // len data...
- constexpr static Addr InputCells = 80; // bytes!
+ /** Stores the dictionary's input buffer (a counted string). */
+ constexpr static Addr Input = sizeof(Cell) * 7;
+ /** Stores the size of the dictionary's input buffer in bytes. */
+ constexpr static Addr InputCells = 80;
+ /** Stores the dictionary's "beginning" i.e. where new definitions begin. */
constexpr static Addr Begin = sizeof(Cell) * 8 + InputCells;
+ /** "Immediate" marker bit for a word's definition. */
constexpr static Cell Immediate = (1 << 5);
+ /** Maximum "short" distance between two definitions. */
+ constexpr static Cell MaxDistance = (1 << (sizeof(Cell) * 8 - 6)) - 1;
- /**
- * Dictionary data can be stored on any read-write interface.
- * You must create a dictionary class that inherits Dictionary and
- * implement these functions. See `memdict.hpp` for a simple block-of-
- * memory implementation.
- */
+ /** Returns the value of the cell at the given address. */
virtual Cell read(Addr) const noexcept = 0;
+
+ /** Writes the given value to the cell at the given address. */
virtual void write(Addr, Cell) noexcept = 0;
+
+ /** Returns the byte stored at the given address. */
virtual uint8_t readbyte(Addr) const noexcept = 0;
+
+ /** Writes the given byte to the given address. */
virtual void writebyte(Addr, uint8_t) noexcept = 0;
+
+ /** Returns the total capacity of the dictionary in bytes. */
virtual unsigned long int capacity() const noexcept = 0;
/**
- * Does initial dictionary setup, required before use for execution.
+ * Initializes essential dictionary values.
+ * Must be called before dictionary use.
*/
void initialize();
+ /**
+ * Gets the address stored in `here`.
+ */
LIBALEE_SECTION
Addr here() const noexcept { return read(Here); }
+
+ /**
+ * Sets the address stored in `here`.
+ */
LIBALEE_SECTION
void here(Addr l) noexcept { write(Here, l); }
+ /**
+ * Gets the value of `latest`.
+ */
LIBALEE_SECTION
Addr latest() const noexcept { return read(Latest); }
+
+ /**
+ * Sets the value of `latest`.
+ */
LIBALEE_SECTION
void latest(Addr l) noexcept { write(Latest, l); }
- // Aligns the given address.
- static Addr aligned(Addr);
- // Aligns `here`.
+ /**
+ * Aligns the given address to the next Cell boundary if necessary.
+ * @param addr The address to align.
+ * @return The resulting aligned address.
+ */
+ static Addr aligned(Addr addr);
+
+ /**
+ * Aligns `here` to the next Cell boundary if necessary.
+ * @return The new aligned address stored in `here`.
+ */
Addr alignhere() noexcept;
- // Advances `here` by the given number of bytes.
- Addr allot(Cell) noexcept;
- // Stores value to `here`, then adds sizeof(Cell) to `here`.
- void add(Cell) noexcept;
/**
- * Uses add() to store a new definition entry starting at `here`.
- * The entry does not become active until a semicolon is executed.
+ * Allocates memory by returning and then increasing the current `here`.
+ * @param count The number of bytes to increase `here` by.
+ * @return The address stored in `here` before the increase.
*/
- void addDefinition(Word) noexcept;
+ Addr allot(Cell count) noexcept;
+
+ /**
+ * Stores the given value to `here` then calls allot to "save" that cell.
+ * @param value The value to store.
+ * @see allot(Cell)
+ */
+ void add(Cell value) noexcept;
+
+ /**
+ * Stores the beginning of a new word definition in the dictionary.
+ * The word must eventually have its definition concluded via semicolon.
+ * @param word The dictionary-stored name of the new word.
+ */
+ void addDefinition(Word word) noexcept;
/**
* Searches the dictionary for an entry for the given word.
- * Returns zero if not found.
+ * @param word The dictionary-stored word to search for.
+ * @return The beginning address of the word or zero if not found.
*/
- Addr find(Word) noexcept;
+ Addr find(Word word) noexcept;
/**
- * Given the address of a dictionary entry, produces the execution token
- * for that entry.
+ * Produces the execution token for the given dictionary entry.
+ * @param addr The beginning address of a defined word.
+ * @return The execution token for the given word.
+ * @see find(Word)
*/
- Addr getexec(Addr) noexcept;
+ Addr getexec(Addr addr) noexcept;
/**
* Reads the next word from the input buffer.
- * Returns an empty word if the buffer is empty or entirely read.
+ * @return The next word or an empty word if one is not available.
*/
Word input() noexcept;
+
+ /**
+ * Returns true if the dictionary's input buffer has immediately available
+ * data.
+ */
bool hasInput() const noexcept;
/**
- * Checks if this dictionary's word is equivalent to the given string/size.
+ * Checks if the dictionary-stored word is equivalent to the given string.
+ * @param word Dictionary-stored word to compare against.
+ * @param str String to compare to.
+ * @param size Size of the string to compare to.
+ * @return True if the two words are equivalent.
*/
- bool equal(Word, const char *, unsigned) const noexcept;
+ bool equal(Word word, const char *str, unsigned size) const noexcept;
/**
- * Checks if two words in this dictionary's word are equivalent.
+ * Checks if two words stored in this dictionary are equivalent.
+ * @param word1 First word to compare
+ * @param word2 Second word to compare
+ * @return True if the words are equivalent.
*/
- bool equal(Word, Word) const noexcept;
+ bool equal(Word word1, Word word2) const noexcept;
- // Used for case-insensitive comparison between two iterators.
+ /**
+ * Generic equality comparison using our own case-insensitive comparator.
+ * Arguments and return value identical to std::equal.
+ */
template<typename Iter1, typename Iter2>
LIBALEE_SECTION
constexpr static bool equal(Iter1 b1, Iter1 e1, Iter2 b2) {
@@ -137,7 +212,10 @@ struct Dictionary
virtual ~Dictionary() {};
private:
- // Case-insensitive comparison.
+ /**
+ * Case-insensitive character comparison used for dictionary lookup.
+ * @return True if the characters are equivalent.
+ */
LIBALEE_SECTION
constexpr static bool eqchars(char c1, char c2) {
if (isalpha(static_cast<uint8_t>(c1)))
diff --git a/libalee/parser.cpp b/libalee/parser.cpp
index b3e8211..11aba38 100644
--- a/libalee/parser.cpp
+++ b/libalee/parser.cpp
@@ -25,14 +25,17 @@ Error Parser::parse(State& state, const char *str)
{
auto addr = Dictionary::Input;
+ // Set source and input length
const auto len = static_cast<Cell>(strlen(str));
state.dict.write(addr, 0);
state.dict.write(Dictionary::SourceLen, len);
+ // Fill input buffer with string contents
addr += sizeof(Cell);
while (*str)
state.dict.writebyte(addr++, *str++);
+ // Zero the remaining input buffer
while (addr < Dictionary::Input + Dictionary::InputCells)
state.dict.writebyte(addr++, '\0');
@@ -54,8 +57,10 @@ LIBALEE_SECTION
Error Parser::parseWord(State& state, Word word)
{
bool imm;
- Addr ins = state.dict.find(word);
+ Addr ins;
+ // Search order: dictionary, core word-set, number, custom parse.
+ ins = state.dict.find(word);
if (ins == 0) {
auto cw = CoreWords::findi(state, word);
@@ -67,7 +72,7 @@ Error Parser::parseWord(State& state, Word word)
return r;
} else {
ins = cw;
- imm = ins == CoreWords::Semicolon;
+ imm = ins == CoreWords::token(";");
}
} else {
imm = state.dict.read(ins) & Dictionary::Immediate;
@@ -119,8 +124,11 @@ LIBALEE_SECTION
void Parser::processLiteral(State& state, Cell value)
{
if (state.compiling()) {
- constexpr auto ins = CoreWords::findi("_lit");
+ constexpr auto ins = CoreWords::token("_lit");
+ // Literal compression: opcodes between WordCount and Begin are unused,
+ // so we assign literals to them to save space. Opcode "WordCount"
+ // pushes zero to the stack, "WordCount + 1" pushes a one, etc.
const Cell maxlit = Dictionary::Begin - CoreWords::WordCount;
if (value >= 0 && value < maxlit)
value += CoreWords::WordCount;
diff --git a/libalee/parser.hpp b/libalee/parser.hpp
index 6b50918..7eca656 100644
--- a/libalee/parser.hpp
+++ b/libalee/parser.hpp
@@ -1,20 +1,22 @@
-/**
- * Alee Forth: A portable and concise Forth implementation in modern C++.
- * Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com>
- *
- * This program is free software: you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation, either version 3 of the License, or
- * (at your option) any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public License
- * along with this program. If not, see <https://www.gnu.org/licenses/>.
- */
+//
+/// @file parser.hpp
+/// @brief Provides functions to parse text for interpretation/execution.
+//
+// Alee Forth: A portable and concise Forth implementation in modern C++.
+// Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com>
+//
+// This program is free software: you can redistribute it and/or modify
+// it under the terms of the GNU Lesser General Public License as published by
+// the Free Software Foundation, either version 3 of the License, or
+// (at your option) any later version.
+//
+// This program is distributed in the hope that it will be useful,
+// but WITHOUT ANY WARRANTY; without even the implied warranty of
+// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+// GNU Lesser General Public License for more details.
+//
+// You should have received a copy of the GNU Lesser General Public License
+// along with this program. If not, see <https://www.gnu.org/licenses/>.
#ifndef ALEEFORTH_PARSER_HPP
#define ALEEFORTH_PARSER_HPP
@@ -25,37 +27,60 @@
#include <string_view>
+/**
+ * @class Parser
+ * @brief Provides routines for parsing Forth code.
+ */
class Parser
{
public:
+ /**
+ * Pointer to a user-provided function that
+ */
static Error (*customParse)(State&, Word);
/**
- * Parses (and evaluates) the given string using the given state.
- * The string is stored in the state's input buffer, then parseSource()
- * works through that using parseWord(). parseWord() will compile or
- * execute as necessary.
+ * Parses and evaluates the given string using the given state.
+ * The string is stored in the state's input buffer before parseSource()
+ * is called.
+ * @param state The state to parse and evaluate with.
+ * @param str The string to parse.
+ * @return Error token to indicate if parsing was successful.
+ * @see parseSource(State&)
*/
- static Error parse(State&, const char *);
+ static Error parse(State& state, const char *str);
/**
- * Parses (and evaluates) through the words stored in the state's input
- * buffer.
+ * Parses through and compiles or evaluates the words stored in the state's
+ * input source.
+ * @param state The state to parse with.
+ * @return Error token to indicate if parsing was successful.
+ * @see parseWord(State&, Word)
*/
- static Error parseSource(State&);
+ static Error parseSource(State& state);
- static void processLiteral(State&, Cell);
+ /**
+ * Parses the given value and either pushes it to the stack or compiles
+ * that functionality.
+ * @param state The state to give the value to.
+ * @param value The value to process.
+ */
+ static void processLiteral(State& state, Cell value);
private:
/**
* Parses the given word using the given state.
+ * @return Error token to indicate if parsing was successful.
*/
static Error parseWord(State&, Word);
/**
* Attempts to parse the given word into a number.
+ * @param state The state object with the dictionary containing the word.
+ * @param word The dictionary-stored word (number) to parse.
+ * @return Error token to indicate if parsing was successful.
*/
- static Error parseNumber(State&, Word);
+ static Error parseNumber(State& state, Word word);
};
#endif // ALEEFORTH_PARSER_HPP
diff --git a/libalee/state.hpp b/libalee/state.hpp
index 0ac9a7c..a5e49b5 100644
--- a/libalee/state.hpp
+++ b/libalee/state.hpp
@@ -1,20 +1,22 @@
-/**
- * Alee Forth: A portable and concise Forth implementation in modern C++.
- * Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com>
- *
- * This program is free software: you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation, either version 3 of the License, or
- * (at your option) any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public License
- * along with this program. If not, see <https://www.gnu.org/licenses/>.
- */
+//
+/// @file state.hpp
+/// @brief Provides object to manage execution and interpretation state.
+//
+// Alee Forth: A portable and concise Forth implementation in modern C++.
+// Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com>
+//
+// This program is free software: you can redistribute it and/or modify
+// it under the terms of the GNU Lesser General Public License as published by
+// the Free Software Foundation, either version 3 of the License, or
+// (at your option) any later version.
+//
+// This program is distributed in the hope that it will be useful,
+// but WITHOUT ANY WARRANTY; without even the implied warranty of
+// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+// GNU Lesser General Public License for more details.
+//
+// You should have received a copy of the GNU Lesser General Public License
+// along with this program. If not, see <https://www.gnu.org/licenses/>.
#ifndef ALEEFORTH_STATE_HPP
#define ALEEFORTH_STATE_HPP
@@ -26,31 +28,53 @@
#include <csetjmp>
#include <cstddef>
+/**
+ * Size of the primary data stack, number of cells.
+ */
constexpr unsigned DataStackSize = 64;
+
+/**
+ * Size of the return stack, number of cells.
+ */
constexpr unsigned ReturnStackSize = 64;
+/**
+ * @class State
+ * Object to track execution state.
+ */
class State
{
+ /** Input functions should add input to the input buffer when available. */
using InputFunc = void (*)(State&);
+ /** Context object that defines a state of execution. */
struct Context {
- Addr ip = 0;
- std::jmp_buf jmpbuf = {};
+ Addr ip = 0; /** Instruction pointer */
+ std::jmp_buf jmpbuf = {}; /** setjmp() buffer for exiting execute() */
};
public:
+ /** Reference to dictionary used by this state. */
Dictionary& dict;
+ /**
+ * Constructs a state object that uses the given dictionary and input
+ * function.
+ * @param d The dictionary to be used by this state
+ * @param i The input collection function to be used by this state
+ */
constexpr State(Dictionary& d, InputFunc i):
dict(d), inputfunc(i), context() {}
/**
- * Begins execution at the given execution token.
+ * Begins execution starting from the given execution token.
* If the token is a CoreWord, this function exits after its execution.
* Otherwise, execution continues until the word's execution completes.
* Encountering an error will cause this function to exit immediately.
+ * @param addr The token to be executed
+ * @return An error token to indicate if execution was successful
*/
- Error execute(Addr);
+ Error execute(Addr addr);
/**
* Clears the data and return stacks, sets ip to zero, and clears the
@@ -58,25 +82,30 @@ public:
*/
void reset();
+ /** Returns a reference to the instruction pointer. */
LIBALEE_SECTION
Addr& ip() noexcept {
return context.ip;
}
+ /** Calls the user input function with this state as the argument. */
LIBALEE_SECTION
void input() noexcept {
inputfunc(*this);
}
+ /** Returns true if currently in a compiling state. */
bool compiling() const;
+ /** Sets the compiling state. True if compiling, false if interpreting. */
void compiling(bool);
+ /** Returns the number of values stored on the data stack. */
std::size_t size() const noexcept;
+ /** Returns the number of values stored on the return stack. */
std::size_t rsize() const noexcept;
/**
- * Saves execution state so that a new execution can begin.
- * Used for EVALUATE.
+ * Returns the current execution state. Usually followed by a load() call.
*/
Context save();
@@ -85,49 +114,77 @@ public:
*/
void load(const Context&);
+ /**
+ * Pushes the given value to the data stack.
+ */
LIBALEE_SECTION
inline void push(Cell value) {
verify(dsp < dstack + DataStackSize, Error::push);
*dsp++ = value;
}
+ /**
+ * Pops a value from the data stack and returns that value.
+ */
LIBALEE_SECTION
inline Cell pop() {
verify(dsp > dstack, Error::pop);
return *--dsp;
}
+ /**
+ * Pushes the given value to the return stack.
+ */
LIBALEE_SECTION
inline void pushr(Cell value) {
verify(rsp < rstack + ReturnStackSize, Error::pushr);
*rsp++ = value;
}
+ /**
+ * Pops a value from the return stack and returns that value.
+ */
LIBALEE_SECTION
inline Cell popr() {
verify(rsp > rstack, Error::popr);
return *--rsp;
}
+ /**
+ * Returns the value stored at the current data stack position.
+ */
LIBALEE_SECTION
inline Cell& top() {
verify(dsp > dstack, Error::top);
return *(dsp - 1);
}
+ /**
+ * Picks a value currently stored on the data stack.
+ * @param i Index from current position to fetch from
+ * @return The value stored at the given index
+ */
LIBALEE_SECTION
inline Cell& pick(std::size_t i) {
verify(dsp - i > dstack, Error::pick);
return *(dsp - i - 1);
}
- // Advances the instruction pointer and returns that cell's contents.
+ /**
+ * Advances the instruction pointer and returns that cell's contents.
+ */
LIBALEE_SECTION
inline Cell beyondip() {
context.ip += sizeof(Cell);
return dict.read(context.ip);
}
+ /**
+ * Asserts the given condition is true, longjmp-ing if false.
+ * Used as an exception handler and the method of exiting execution.
+ * @param condition Condition to be tested
+ * @param error Error code to report via longjmp() on false condition
+ */
LIBALEE_SECTION
inline void verify(bool condition, Error error) {
if (!condition)
@@ -135,13 +192,13 @@ public:
}
private:
- InputFunc inputfunc; // User-provided function to collect "stdin" input.
- Context context;
+ InputFunc inputfunc; /** User-provided function to collect user input. */
+ Context context; /** State's current execution context. */
- Cell dstack[DataStackSize] = {};
- Cell rstack[ReturnStackSize] = {};
- Cell *dsp = dstack;
- Cell *rsp = rstack;
+ Cell dstack[DataStackSize] = {}; /** Data stack */
+ Cell rstack[ReturnStackSize] = {}; /** Return stack */
+ Cell *dsp = dstack; /** Current data stack position */
+ Cell *rsp = rstack; /** Current return stack position */
};
#endif // ALEEFORTH_STATE_HPP
diff --git a/libalee/types.hpp b/libalee/types.hpp
index 028c490..7b5bb62 100644
--- a/libalee/types.hpp
+++ b/libalee/types.hpp
@@ -1,20 +1,22 @@
-/**
- * Alee Forth: A portable and concise Forth implementation in modern C++.
- * Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com>
- *
- * This program is free software: you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation, either version 3 of the License, or
- * (at your option) any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public License
- * along with this program. If not, see <https://www.gnu.org/licenses/>.
- */
+//
+/// @file types.hpp
+/// @brief Defines common types used throughout Alee Forth.
+//
+// Alee Forth: A portable and concise Forth implementation in modern C++.
+// Copyright (C) 2023 Clyne Sullivan <clyne@bitgloo.com>
+//
+// This program is free software: you can redistribute it and/or modify
+// it under the terms of the GNU Lesser General Public License as published by
+// the Free Software Foundation, either version 3 of the License, or
+// (at your option) any later version.
+//
+// This program is distributed in the hope that it will be useful,
+// but WITHOUT ANY WARRANTY; without even the implied warranty of
+// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+// GNU Lesser General Public License for more details.
+//
+// You should have received a copy of the GNU Lesser General Public License
+// along with this program. If not, see <https://www.gnu.org/licenses/>.
#ifndef ALEEFORTH_TYPES_HPP
#define ALEEFORTH_TYPES_HPP
@@ -22,55 +24,86 @@
#include <cstdint>
#include <iterator>
-/**
- * Configure the below types for your platform.
- */
+/** Dictionary address type. Must be equivalent to "unsigned Cell". */
using Addr = uint16_t;
+/** Data cell type. Dictionary is basically an array of this type. */
using Cell = int16_t;
+/** Double-width cell type. Must be twice the size of Cell. */
using DoubleCell = int32_t;
-using DoubleAddr = uint32_t; // Only used for um/mod.
+/** Double-width addr type. Must be twice the size of Addr. Used by um/mod. */
+using DoubleAddr = uint32_t;
struct Dictionary;
struct State;
-using Func = void (*)(State&);
-
+/**
+ * Error enum to report success or failure of parsing or execution.
+ */
enum class Error : int {
- none = 0,
- push,
- pop,
- pushr,
- popr,
- top,
- pick,
- exit,
- noword
+ none = 0, /** No error */
+ push, /** Could not push (data stack overflow) */
+ pop, /** Could not pop (data stack underflow) */
+ pushr, /** Could not push (return stack overflow) */
+ popr, /** Could not pop (return stack underflow) */
+ top, /** Could not fetch data stack top (data stack underflow) */
+ pick, /** Could not pick data stack value (data stack underflow) */
+ exit, /** No error, exited from State::execute() */
+ noword /** Parsing failed because the word was not found */
};
/**
- * Stores the start and past-the-end addresses of a dictionary's word.
+ * @class Word
+ * Stores the beginning and end indices of a dictionary-defined word.
*/
class Word
{
+ /** Beginning (inclusive) index */
Addr start;
+ /** End (exclusive) index */
Addr wend;
public:
struct iterator;
+ /**
+ * Constructs a word with the given start and end indices.
+ * @param s Start/beginning index
+ * @param e (past-the-)end index
+ */
constexpr explicit Word(Addr s = 0, Addr e = 0):
start(s), wend(e) {}
+ /**
+ * Constructs a word using beginning index and length.
+ * @param s Beginning/start index of word
+ * @param l Count of bytes until end of word
+ * @return Resulting Word object
+ */
LIBALEE_SECTION
static constexpr Word fromLength(Addr s, Addr l) {
return Word(s, s + l);
}
+ /** Returns the size of this word in bytes. */
Addr size() const noexcept;
- iterator begin(const Dictionary *);
- iterator end(const Dictionary *);
-
+ /**
+ * Creates a beginning iterator for the word.
+ * @param dict Pointer to dictionary object containing this word
+ * @return Iterator pointing to this word's beginning
+ */
+ iterator begin(const Dictionary *dict);
+
+ /**
+ * Creates an end iterator for the word.
+ * @param dict Pointer to dictionary object containing this word
+ * @return Iterator pointing to past-the-end of this word
+ */
+ iterator end(const Dictionary *dict);
+
+ /**
+ * Forward-iterator for iterating through the letters of this word.
+ */
struct iterator {
using iterator_category = std::input_iterator_tag;
using value_type = uint8_t;
@@ -78,15 +111,26 @@ public:
using reference = void;
using difference_type = Cell;
+ /** Iterator's current address within its containing dictionary. */
Addr addr;
+ /** Pointer to dictionary that contains this word. */
const Dictionary *dict;
+ /**
+ * Constructs a word iterator.
+ * @param a The address the iterator points to
+ * @param d The dictionary that contains this word
+ */
constexpr iterator(Addr a, const Dictionary *d):
addr(a), dict(d) {}
+ /** Prefix increment */
iterator& operator++();
+ /** Postfix increment */
iterator operator++(int);
+ /** Returns value pointed to by iterator */
value_type operator*();
+ /** Iterator comparison function (case-insensitive) */
bool operator!=(const iterator&);
};
};