MIXAL
expression.cpp
Go to the documentation of this file.
1 #include <cassert>
2 #include <limits>
3 #include <iostream>
4 #include "expression.h"
5 
11 namespace mixal {
12 
13 Expression::Expression() : _evaluated(false), _result(), _literalConstant(false),
14  _depends(), _atomics(), _operations() {
15 }
16 
17 Expression::Expression(const std::string& expression, const std::string& lineSymbol) :
18  _evaluated(false), _result(), _literalConstant(false),
19  _depends(), _atomics(), _operations() {
20  parse(expression, lineSymbol);
21 }
22 
24  auto expr = Expression();
25  expr._evaluated = true;
26  expr._result = value;
27  expr._atomics.emplace_back(Atomic(AtomicType::INTEGER, value.value));
28  return expr;
29 }
30 
31 Expression Expression::getConstExpression(const std::string& symbol) {
32  auto expr = Expression();
33  expr._atomics.emplace_back(Atomic(AtomicType::SYMBOL, symbol));
34  expr._depends.insert(symbol);
35  return expr;
36 }
37 
38 Expression Expression::getConstOffsetExpression(const std::string& symbol, int32_t offset) {
39  auto expr = Expression();
40  expr._atomics = {Atomic(AtomicType::SYMBOL, symbol), Atomic(AtomicType::INTEGER, offset)};
41  expr._operations = {Operation::ADD};
42  expr._depends.insert(symbol);
43  return expr;
44 }
45 
46 bool Expression::isValidFirst(char ch) {
47  return isalnum(ch) || ch == '+' || ch == '-' || ch == '*' || ch == '=';
48 }
49 
50 bool Expression::isValidChar(char ch) {
51  return isValidFirst(ch) || ch == '/' || ch == ':';
52 }
53 
77 enum class ExprParseState {
78  START,
79  ATOMIC,
80  OPERATION,
81  END,
82 };
83 
85 inline bool isOperationFirst(char ch) {
86  return ch == '+' || ch == '-' || ch == '*' || ch == '/' || ch == ':';
87 }
88 
89 void Expression::parse(const std::string& expression, const std::string& lineSymbol) {
90  this->reset();
91  const char END_CHAR = '#'; // The character that indicates the end of the input.
92  const int INIT_INDEX = -1; // The uninitialized index value.
93  ExprParseState state = ExprParseState::START;
94  int lastAtomicStart = INIT_INDEX; // The start index of the last atomic.
95  int lastOperationStart = INIT_INDEX; // The start index of the last operation.
96 
97  // Check whether this is a literal constant that starts and ends with a `=`.
98  int start = 0;
99  int exprLen = static_cast<int>(expression.size());
100  if (exprLen > 2 && expression[0] == '=' && expression[exprLen - 1] == '=') {
101  _literalConstant = true;
102  start = 1;
103  --exprLen;
104  }
105 
106  // Parsing the expression.
107  for (int i = start; i <= exprLen; ++i) {
108  char ch = i < exprLen ? expression[i] : END_CHAR;
109  switch (state) {
110  case ExprParseState::START:
111  if (ch == '+' || ch == '-' || ch == '*' || isalnum(ch)) {
112  state = ExprParseState::ATOMIC;
113  lastAtomicStart = i;
114  } else if (ch == END_CHAR) {
115  throw ExpressionError(i, "The expression is empty.");
116  } else {
117  throw ExpressionError(i,
118  "Invalid character found at the start of the expression: " + std::string(1, ch));
119  }
120  break;
121 
122  case ExprParseState::ATOMIC:
123  assert(lastAtomicStart != INIT_INDEX);
124  if (expression[lastAtomicStart] == '*' ||
125  (lastAtomicStart + 1 < i &&
126  (expression[lastAtomicStart] == '+' || expression[lastAtomicStart] == '-') &&
127  expression[lastAtomicStart + 1] == '*')) {
128  // The atomic that matches `*`, `+*`, or `-*`.
129  if (ch == END_CHAR) {
130  state = ExprParseState::END;
131  } else if (isOperationFirst(ch)) {
132  state = ExprParseState::OPERATION;
133  lastOperationStart = i;
134  } else {
135  throw ExpressionError(i,
136  "Invalid character found while trying to find an operation: " + std::string(1, ch));
137  }
138  bool negative = expression[lastAtomicStart] == '-';
139  _atomics.emplace_back(Atomic(AtomicType::ASTERISK, lineSymbol, negative));
140  _depends.insert(lineSymbol);
141  } else if (isalnum(ch) ||
142  ((expression[lastAtomicStart] == '+' || expression[lastAtomicStart] == '-') &&
143  lastAtomicStart + 1 == i && ch == '*')) {
144  } else {
145  if (ch == END_CHAR) {
146  state = ExprParseState::END;
147  } else if (isOperationFirst(ch)) {
148  state = ExprParseState::OPERATION;
149  lastOperationStart = i;
150  } else {
151  throw ExpressionError(i,
152  "Invalid character found while trying to find an operation: " + std::string(1, ch));
153  }
154  bool isInteger = true, negative = false;
155  int32_t integerValue = 0;
156  if (expression[lastAtomicStart] == '-') {
157  negative = true;
158  ++lastAtomicStart;
159  } else if (expression[lastAtomicStart] == '+') {
160  ++lastAtomicStart;
161  }
162  if (lastAtomicStart == i) {
163  throw ExpressionError(i, "The atomic is empty: " +
164  std::to_string(expression[lastAtomicStart - 1]));
165  }
166  // Check the type of the atomic. Note that symbols can start with digits.
167  for (int j = lastAtomicStart; j < i; ++j) {
168  if (isalpha(expression[j])) {
169  isInteger = false;
170  break;
171  }
172  int32_t digit = expression[j] - '0';
173  if (integerValue > (std::numeric_limits<int32_t>::max() - digit) / 10) {
174  throw ExpressionError(i, "The integer value is too large: " +
175  expression.substr(lastAtomicStart, i - lastAtomicStart));
176  }
177  integerValue = integerValue * 10 + digit;
178  }
179  if (isInteger) {
180  _atomics.emplace_back(Atomic(AtomicType::INTEGER, integerValue, negative));
181  } else {
182  auto symbol = expression.substr(lastAtomicStart, i - lastAtomicStart);
183  _atomics.emplace_back(Atomic(AtomicType::SYMBOL, symbol, negative));
184  _depends.insert(symbol);
185  }
186  }
187  break;
188 
189  case ExprParseState::OPERATION:
190  assert(lastOperationStart != INIT_INDEX);
191  if (ch == '/') {
192  // The `/` could be continuous for `//`.
193  } else if (ch == END_CHAR) {
194  throw ExpressionError(i, "No atomic found after the binary operator");
195  } else {
196  state = ExprParseState::ATOMIC;
197  lastAtomicStart = i;
198  if (i - lastOperationStart == 1) {
199  switch (expression[lastOperationStart]) {
200  case '+':
201  _operations.emplace_back(Operation::ADD);
202  break;
203  case '-':
204  _operations.emplace_back(Operation::SUBTRACT);
205  break;
206  case '*':
207  _operations.emplace_back(Operation::MULTIPLY);
208  break;
209  case '/':
210  _operations.emplace_back(Operation::FLOOR_DIV);
211  break;
212  case ':':
213  _operations.emplace_back(Operation::FIELD);
214  break;
215  }
216  } else {
217  // TODO(admin): Add float division.
218  throw ExpressionError(i, "Unknown binary operator found");
219  }
220  }
221  break;
222 
223  case ExprParseState::END:
224  break;
225  }
226  }
227  // The parsing should always end with END state.
228  assert(state == ExprParseState::END);
229  // Since all the operations are binary, there should be exactly one more operations than atomics.
230  assert(_atomics.size() == _operations.size() + 1);
231 }
232 
233 bool Expression::evaluate(const std::unordered_map<std::string, AtomicValue>& constants) {
234  if (_atomics.size() == 0) {
235  return false;
236  }
237  auto evalAtomic = [&constants](const Atomic& atomic, AtomicValue* result) -> bool {
238  if (atomic.type == AtomicType::INTEGER) {
239  result->negative = atomic.negative;
240  result->value = atomic.integer;
241  if (atomic.negative) {
242  result->value = -result->value;
243  }
244  } else {
245  auto it = constants.find(atomic.symbol);
246  if (it == constants.end()) {
247  return false;
248  }
249  *result = it->second;
250  if (atomic.negative) {
251  result->negative = !result->negative;
252  result->value = -result->value;
253  }
254  }
255  return true;
256  };
257  AtomicValue first, second;
258  if (!evalAtomic(_atomics[0], &first)) {
259  return false;
260  }
261  for (size_t i = 0; i < _operations.size(); ++i) {
262  if (!evalAtomic(_atomics[i + 1], &second)) {
263  return false;
264  }
265  switch (_operations[i]) {
266  case Operation::ADD:
267  first.value += second.value;
268  break;
269  case Operation::SUBTRACT:
270  first.value -= second.value;
271  break;
272  case Operation::MULTIPLY:
273  first.value *= second.value;
274  break;
275  case Operation::FLOOR_DIV:
276  first.value /= second.value;
277  break;
278  case Operation::FIELD:
279  first.value = first.value * 8 + second.value;
280  break;
281  }
282  if (first.value > 0) {
283  first.negative = false;
284  } else if (first.value < 0) {
285  first.negative = true;
286  }
287  }
288  _evaluated = true;
289  _result = first;
290  return true;
291 }
292 
293 void Expression::replaceSymbol(const std::unordered_map<std::string, std::string>& mapping) {
294  for (auto& atomic : _atomics) {
295  if (atomic.type == AtomicType::SYMBOL) {
296  auto it = mapping.find(atomic.symbol);
297  if (it != mapping.end()) {
298  atomic.replaceSymbol(it->second);
299  _depends.erase(it->first);
300  _depends.insert(it->second);
301  }
302  }
303  }
304 }
305 
307  _evaluated = false;
308  _literalConstant = false;
309  _depends.clear();
310  _atomics.clear();
311  _operations.clear();
312 }
313 
314 bool Expression::operator==(const Expression& expression) {
315  if (_atomics.size() != expression._atomics.size()) {
316  return false;
317  }
318  for (size_t i = 0; i < _atomics.size(); ++i) {
319  if (_atomics[i] != expression._atomics[i]) {
320  return false;
321  }
322  }
323  for (size_t i = 0; i < _operations.size(); ++i) {
324  if (_operations[i] != expression._operations[i]) {
325  return false;
326  }
327  }
328  return true;
329 }
330 
331 bool Expression::operator!=(const Expression& expression) {
332  return !((*this) == expression);
333 }
334 
335 std::ostream& operator<<(std::ostream& out, Operation operation) {
336  switch (operation) {
337  case Operation::ADD: out << '+'; break;
338  case Operation::SUBTRACT: out << '-'; break;
339  case Operation::MULTIPLY: out << '*'; break;
340  case Operation::FLOOR_DIV: out << '/'; break;
341  case Operation::FIELD: out << ':'; break;
342  }
343  return out;
344 }
345 
346 std::ostream& operator<<(std::ostream& out, const Expression& expression) {
347  if (expression._atomics.size() > 0) {
348  out << expression._atomics[0];
349  }
350  for (size_t i = 0; i < expression._operations.size(); ++i) {
351  out << expression._operations[i];
352  out << expression._atomics[i + 1];
353  }
354  return out;
355 }
356 
357 }; // namespace mixal
expression.h
To parse the expressions.
mixal::Expression::operator==
bool operator==(const Expression &expression)
Definition: expression.cpp:314
mixal::Expression::replaceSymbol
void replaceSymbol(const std::unordered_map< std::string, std::string > &mapping)
Definition: expression.cpp:293
mixal::ExprParseState
ExprParseState
Definition: expression.cpp:77
mixal::Expression::isValidFirst
static bool isValidFirst(char ch)
Definition: expression.cpp:46
mixal::Atomic::negative
bool negative
Definition: expression.h:27
mixal::Expression::getConstOffsetExpression
static Expression getConstOffsetExpression(const std::string &symbol, int32_t offset)
Definition: expression.cpp:38
mixal::Expression::isValidChar
static bool isValidChar(char ch)
Definition: expression.cpp:50
mixal::Operation
Operation
Definition: expression.h:90
mixal::Atomic::integer
int32_t integer
Definition: expression.h:28
mixal::Expression::parse
void parse(const std::string &expression, const std::string &lineSymbol)
Definition: expression.cpp:89
mixal::Expression::evaluate
bool evaluate(const std::unordered_map< std::string, AtomicValue > &constants)
Definition: expression.cpp:233
mixal::Expression::reset
void reset()
Definition: expression.cpp:306
mixal::Expression::getConstExpression
static Expression getConstExpression(const AtomicValue &value)
Definition: expression.cpp:23
mixal::Atomic::type
AtomicType type
Definition: expression.h:26
mixal::Atomic::symbol
std::string symbol
Definition: expression.h:29
mixal::operator<<
std::ostream & operator<<(std::ostream &out, Operation operation)
Definition: expression.cpp:335
mixal::Expression::operator!=
bool operator!=(const Expression &expression)
Definition: expression.cpp:331
mixal::AtomicValue
Definition: expression.h:75
mixal::Expression::result
const AtomicValue & result() const
Definition: expression.h:146
mixal::Expression::Expression
Expression()
Definition: expression.cpp:13
mixal::Expression
Definition: expression.h:103
mixal::isOperationFirst
bool isOperationFirst(char ch)
Definition: expression.cpp:85
mixal::Atomic
Definition: expression.h:25
mixal::ExpressionError
Definition: errors.h:15