MIXAL
Public Member Functions | Static Public Member Functions | Friends | List of all members
mixal::Expression Class Reference

#include <expression.h>

Public Member Functions

 Expression ()
 
 Expression (const std::string &expression, const std::string &lineSymbol="")
 
bool evaluated () const
 
const AtomicValueresult () const
 
bool literalConstant () const
 
const std::unordered_set< std::string > depends () const
 
const std::vector< Atomicatomics () const
 
const std::vector< Operationoperations () const
 
void parse (const std::string &expression, const std::string &lineSymbol)
 
bool evaluate (const std::unordered_map< std::string, AtomicValue > &constants)
 
void replaceSymbol (const std::unordered_map< std::string, std::string > &mapping)
 
void reset ()
 
bool operator== (const Expression &expression)
 
bool operator!= (const Expression &expression)
 

Static Public Member Functions

static Expression getConstExpression (const AtomicValue &value)
 
static Expression getConstExpression (const std::string &symbol)
 
static Expression getConstOffsetExpression (const std::string &symbol, int32_t offset)
 
static bool isValidFirst (char ch)
 
static bool isValidChar (char ch)
 

Friends

std::ostream & operator<< (std::ostream &out, const Expression &expression)
 

Detailed Description

Parse and store expressions.

Definition at line 103 of file expression.h.

Constructor & Destructor Documentation

◆ Expression() [1/2]

mixal::Expression::Expression ( )

Initialize with zeros.

Definition at line 13 of file expression.cpp.

13  : _evaluated(false), _result(), _literalConstant(false),
14  _depends(), _atomics(), _operations() {
15 }

Referenced by getConstExpression(), and getConstOffsetExpression().

◆ Expression() [2/2]

mixal::Expression::Expression ( const std::string &  expression,
const std::string &  lineSymbol = "" 
)
explicit

Initialize with parsing

See also
parse(const std::string&, const std::string&)

Definition at line 17 of file expression.cpp.

17  :
18  _evaluated(false), _result(), _literalConstant(false),
19  _depends(), _atomics(), _operations() {
20  parse(expression, lineSymbol);
21 }

References parse().

Member Function Documentation

◆ atomics()

const std::vector<Atomic> mixal::Expression::atomics ( ) const
inline

Get the atomics in the expression.

Definition at line 154 of file expression.h.

154 { return _atomics; }

◆ depends()

const std::unordered_set<std::string> mixal::Expression::depends ( ) const
inline

Get the symbols that should be evaluated before evaluating this expression.

Definition at line 152 of file expression.h.

152 { return _depends; }

◆ evaluate()

bool mixal::Expression::evaluate ( const std::unordered_map< std::string, AtomicValue > &  constants)

Try to evaluate the parsed expression.

Parameters
constantsA dictionary that maps from symbol names to evaluated atomic values.
Returns
Return true if the expression can be evaluated with the given dictionary.

Definition at line 233 of file expression.cpp.

233  {
234  if (_atomics.size() == 0) {
235  return false;
236  }
237  auto evalAtomic = [&constants](const Atomic& atomic, AtomicValue* result) -> bool {
238  if (atomic.type == AtomicType::INTEGER) {
239  result->negative = atomic.negative;
240  result->value = atomic.integer;
241  if (atomic.negative) {
242  result->value = -result->value;
243  }
244  } else {
245  auto it = constants.find(atomic.symbol);
246  if (it == constants.end()) {
247  return false;
248  }
249  *result = it->second;
250  if (atomic.negative) {
251  result->negative = !result->negative;
252  result->value = -result->value;
253  }
254  }
255  return true;
256  };
257  AtomicValue first, second;
258  if (!evalAtomic(_atomics[0], &first)) {
259  return false;
260  }
261  for (size_t i = 0; i < _operations.size(); ++i) {
262  if (!evalAtomic(_atomics[i + 1], &second)) {
263  return false;
264  }
265  switch (_operations[i]) {
266  case Operation::ADD:
267  first.value += second.value;
268  break;
269  case Operation::SUBTRACT:
270  first.value -= second.value;
271  break;
272  case Operation::MULTIPLY:
273  first.value *= second.value;
274  break;
275  case Operation::FLOOR_DIV:
276  first.value /= second.value;
277  break;
278  case Operation::FIELD:
279  first.value = first.value * 8 + second.value;
280  break;
281  }
282  if (first.value > 0) {
283  first.negative = false;
284  } else if (first.value < 0) {
285  first.negative = true;
286  }
287  }
288  _evaluated = true;
289  _result = first;
290  return true;
291 }

References mixal::Atomic::integer, mixal::Atomic::negative, result(), mixal::Atomic::symbol, and mixal::Atomic::type.

◆ evaluated()

bool mixal::Expression::evaluated ( ) const
inline

Whether the expression has been evaluated.

Definition at line 144 of file expression.h.

144 { return _evaluated; }

Referenced by mixal::ParsedResult::evaluated(), and mixal::operator<<().

◆ getConstExpression() [1/2]

Expression mixal::Expression::getConstExpression ( const AtomicValue value)
static

Get a constant expression based on a given atomic value.

Definition at line 23 of file expression.cpp.

23  {
24  auto expr = Expression();
25  expr._evaluated = true;
26  expr._result = value;
27  expr._atomics.emplace_back(Atomic(AtomicType::INTEGER, value.value));
28  return expr;
29 }

References Expression().

Referenced by mixal::Computer::loadCodes(), and mixal::Parser::parseLine().

◆ getConstExpression() [2/2]

Expression mixal::Expression::getConstExpression ( const std::string &  symbol)
static

Get a constant expression based on a given symbol.

The evaluation will depend on the given symbol.

Definition at line 31 of file expression.cpp.

31  {
32  auto expr = Expression();
33  expr._atomics.emplace_back(Atomic(AtomicType::SYMBOL, symbol));
34  expr._depends.insert(symbol);
35  return expr;
36 }

References Expression().

◆ getConstOffsetExpression()

Expression mixal::Expression::getConstOffsetExpression ( const std::string &  symbol,
int32_t  offset 
)
static

Get a constant expression based on a given symbol and an offset.

This is used for representing the offset from an address.

Definition at line 38 of file expression.cpp.

38  {
39  auto expr = Expression();
40  expr._atomics = {Atomic(AtomicType::SYMBOL, symbol), Atomic(AtomicType::INTEGER, offset)};
41  expr._operations = {Operation::ADD};
42  expr._depends.insert(symbol);
43  return expr;
44 }

References Expression().

Referenced by mixal::Computer::loadCodes().

◆ isValidChar()

bool mixal::Expression::isValidChar ( char  ch)
static

Whether a character is valid inside an expression.

Besides the valid characters at the beginning, the rest characters in the operations are also valid: / and :.

See also
isValidFirst(char)

Definition at line 50 of file expression.cpp.

50  {
51  return isValidFirst(ch) || ch == '/' || ch == ':';
52 }

References isValidFirst().

Referenced by mixal::Parser::parseLine().

◆ isValidFirst()

bool mixal::Expression::isValidFirst ( char  ch)
static

Whether an expression can start with the given character.

The first character could be:

  • [0-9A-Z], for symbols.
  • *, for current location.
  • [+-], for the sign of an atomic.
  • =, for literal constant.

Definition at line 46 of file expression.cpp.

46  {
47  return isalnum(ch) || ch == '+' || ch == '-' || ch == '*' || ch == '=';
48 }

Referenced by isValidChar(), and mixal::Parser::parseLine().

◆ literalConstant()

bool mixal::Expression::literalConstant ( ) const
inline

Whether this is a literal constant, which is surrounded by =.

Definition at line 149 of file expression.h.

149 { return _literalConstant; }

Referenced by mixal::Computer::executeSingle().

◆ operations()

const std::vector<Operation> mixal::Expression::operations ( ) const
inline

Get the operations in the expression.

Definition at line 156 of file expression.h.

156 { return _operations; }

◆ operator!=()

bool mixal::Expression::operator!= ( const Expression expression)

Whether two expressions are different.

Definition at line 331 of file expression.cpp.

331  {
332  return !((*this) == expression);
333 }

◆ operator==()

bool mixal::Expression::operator== ( const Expression expression)

Whether two expressions are the same.

Definition at line 314 of file expression.cpp.

314  {
315  if (_atomics.size() != expression._atomics.size()) {
316  return false;
317  }
318  for (size_t i = 0; i < _atomics.size(); ++i) {
319  if (_atomics[i] != expression._atomics[i]) {
320  return false;
321  }
322  }
323  for (size_t i = 0; i < _operations.size(); ++i) {
324  if (_operations[i] != expression._operations[i]) {
325  return false;
326  }
327  }
328  return true;
329 }

◆ parse()

void mixal::Expression::parse ( const std::string &  expression,
const std::string &  lineSymbol 
)

Try to parse an expression string.

Parameters
expressionA string containing only the expression.
lineSymbolThe symbol representing the current location. Used for * to point to the current location.
Exceptions
ExpressionErrorWhen the input expression string is invalid.

Definition at line 89 of file expression.cpp.

89  {
90  this->reset();
91  const char END_CHAR = '#'; // The character that indicates the end of the input.
92  const int INIT_INDEX = -1; // The uninitialized index value.
93  ExprParseState state = ExprParseState::START;
94  int lastAtomicStart = INIT_INDEX; // The start index of the last atomic.
95  int lastOperationStart = INIT_INDEX; // The start index of the last operation.
96 
97  // Check whether this is a literal constant that starts and ends with a `=`.
98  int start = 0;
99  int exprLen = static_cast<int>(expression.size());
100  if (exprLen > 2 && expression[0] == '=' && expression[exprLen - 1] == '=') {
101  _literalConstant = true;
102  start = 1;
103  --exprLen;
104  }
105 
106  // Parsing the expression.
107  for (int i = start; i <= exprLen; ++i) {
108  char ch = i < exprLen ? expression[i] : END_CHAR;
109  switch (state) {
110  case ExprParseState::START:
111  if (ch == '+' || ch == '-' || ch == '*' || isalnum(ch)) {
112  state = ExprParseState::ATOMIC;
113  lastAtomicStart = i;
114  } else if (ch == END_CHAR) {
115  throw ExpressionError(i, "The expression is empty.");
116  } else {
117  throw ExpressionError(i,
118  "Invalid character found at the start of the expression: " + std::string(1, ch));
119  }
120  break;
121 
122  case ExprParseState::ATOMIC:
123  assert(lastAtomicStart != INIT_INDEX);
124  if (expression[lastAtomicStart] == '*' ||
125  (lastAtomicStart + 1 < i &&
126  (expression[lastAtomicStart] == '+' || expression[lastAtomicStart] == '-') &&
127  expression[lastAtomicStart + 1] == '*')) {
128  // The atomic that matches `*`, `+*`, or `-*`.
129  if (ch == END_CHAR) {
130  state = ExprParseState::END;
131  } else if (isOperationFirst(ch)) {
132  state = ExprParseState::OPERATION;
133  lastOperationStart = i;
134  } else {
135  throw ExpressionError(i,
136  "Invalid character found while trying to find an operation: " + std::string(1, ch));
137  }
138  bool negative = expression[lastAtomicStart] == '-';
139  _atomics.emplace_back(Atomic(AtomicType::ASTERISK, lineSymbol, negative));
140  _depends.insert(lineSymbol);
141  } else if (isalnum(ch) ||
142  ((expression[lastAtomicStart] == '+' || expression[lastAtomicStart] == '-') &&
143  lastAtomicStart + 1 == i && ch == '*')) {
144  } else {
145  if (ch == END_CHAR) {
146  state = ExprParseState::END;
147  } else if (isOperationFirst(ch)) {
148  state = ExprParseState::OPERATION;
149  lastOperationStart = i;
150  } else {
151  throw ExpressionError(i,
152  "Invalid character found while trying to find an operation: " + std::string(1, ch));
153  }
154  bool isInteger = true, negative = false;
155  int32_t integerValue = 0;
156  if (expression[lastAtomicStart] == '-') {
157  negative = true;
158  ++lastAtomicStart;
159  } else if (expression[lastAtomicStart] == '+') {
160  ++lastAtomicStart;
161  }
162  if (lastAtomicStart == i) {
163  throw ExpressionError(i, "The atomic is empty: " +
164  std::to_string(expression[lastAtomicStart - 1]));
165  }
166  // Check the type of the atomic. Note that symbols can start with digits.
167  for (int j = lastAtomicStart; j < i; ++j) {
168  if (isalpha(expression[j])) {
169  isInteger = false;
170  break;
171  }
172  int32_t digit = expression[j] - '0';
173  if (integerValue > (std::numeric_limits<int32_t>::max() - digit) / 10) {
174  throw ExpressionError(i, "The integer value is too large: " +
175  expression.substr(lastAtomicStart, i - lastAtomicStart));
176  }
177  integerValue = integerValue * 10 + digit;
178  }
179  if (isInteger) {
180  _atomics.emplace_back(Atomic(AtomicType::INTEGER, integerValue, negative));
181  } else {
182  auto symbol = expression.substr(lastAtomicStart, i - lastAtomicStart);
183  _atomics.emplace_back(Atomic(AtomicType::SYMBOL, symbol, negative));
184  _depends.insert(symbol);
185  }
186  }
187  break;
188 
189  case ExprParseState::OPERATION:
190  assert(lastOperationStart != INIT_INDEX);
191  if (ch == '/') {
192  // The `/` could be continuous for `//`.
193  } else if (ch == END_CHAR) {
194  throw ExpressionError(i, "No atomic found after the binary operator");
195  } else {
196  state = ExprParseState::ATOMIC;
197  lastAtomicStart = i;
198  if (i - lastOperationStart == 1) {
199  switch (expression[lastOperationStart]) {
200  case '+':
201  _operations.emplace_back(Operation::ADD);
202  break;
203  case '-':
204  _operations.emplace_back(Operation::SUBTRACT);
205  break;
206  case '*':
207  _operations.emplace_back(Operation::MULTIPLY);
208  break;
209  case '/':
210  _operations.emplace_back(Operation::FLOOR_DIV);
211  break;
212  case ':':
213  _operations.emplace_back(Operation::FIELD);
214  break;
215  }
216  } else {
217  // TODO(admin): Add float division.
218  throw ExpressionError(i, "Unknown binary operator found");
219  }
220  }
221  break;
222 
223  case ExprParseState::END:
224  break;
225  }
226  }
227  // The parsing should always end with END state.
228  assert(state == ExprParseState::END);
229  // Since all the operations are binary, there should be exactly one more operations than atomics.
230  assert(_atomics.size() == _operations.size() + 1);
231 }

References mixal::isOperationFirst(), and reset().

Referenced by Expression(), and mixal::Parser::parseLine().

◆ replaceSymbol()

void mixal::Expression::replaceSymbol ( const std::unordered_map< std::string, std::string > &  mapping)

Replace the symbols in the expression.

This is used for replacing local symbols.

Definition at line 293 of file expression.cpp.

293  {
294  for (auto& atomic : _atomics) {
295  if (atomic.type == AtomicType::SYMBOL) {
296  auto it = mapping.find(atomic.symbol);
297  if (it != mapping.end()) {
298  atomic.replaceSymbol(it->second);
299  _depends.erase(it->first);
300  _depends.insert(it->second);
301  }
302  }
303  }
304 }

◆ reset()

void mixal::Expression::reset ( )

Clear the parsed results.

Definition at line 306 of file expression.cpp.

306  {
307  _evaluated = false;
308  _literalConstant = false;
309  _depends.clear();
310  _atomics.clear();
311  _operations.clear();
312 }

Referenced by parse().

◆ result()

const AtomicValue& mixal::Expression::result ( ) const
inline

Get the evaluated atomic value.

Definition at line 146 of file expression.h.

146 { return _result; }

Referenced by evaluate(), and mixal::operator<<().

Friends And Related Function Documentation

◆ operator<<

std::ostream& operator<< ( std::ostream &  out,
const Expression expression 
)
friend

Output the expression.

Definition at line 346 of file expression.cpp.

346  {
347  if (expression._atomics.size() > 0) {
348  out << expression._atomics[0];
349  }
350  for (size_t i = 0; i < expression._operations.size(); ++i) {
351  out << expression._operations[i];
352  out << expression._atomics[i + 1];
353  }
354  return out;
355 }

The documentation for this class was generated from the following files:
mixal::ExprParseState
ExprParseState
Definition: expression.cpp:77
mixal::Expression::isValidFirst
static bool isValidFirst(char ch)
Definition: expression.cpp:46
mixal::Expression::parse
void parse(const std::string &expression, const std::string &lineSymbol)
Definition: expression.cpp:89
mixal::Expression::reset
void reset()
Definition: expression.cpp:306
mixal::Expression::result
const AtomicValue & result() const
Definition: expression.h:146
mixal::Expression::Expression
Expression()
Definition: expression.cpp:13
mixal::isOperationFirst
bool isOperationFirst(char ch)
Definition: expression.cpp:85