3 * This source code is part of
7 * GROningen MAchine for Chemical Simulations
9 * Written by David van der Spoel, Erik Lindahl, Berk Hess, and others.
10 * Copyright (c) 1991-2000, University of Groningen, The Netherlands.
11 * Copyright (c) 2001-2009, The GROMACS development team,
12 * check out http://www.gromacs.org for more information.
14 * This program is free software; you can redistribute it and/or
15 * modify it under the terms of the GNU General Public License
16 * as published by the Free Software Foundation; either version 2
17 * of the License, or (at your option) any later version.
19 * If you want to redistribute modifications, please consider that
20 * scientific software is very special. Version control is crucial -
21 * bugs must be traceable. We will be happy to consider code for
22 * inclusion in the official distribution, but derived work must not
23 * be called official GROMACS. Details are found in the README & COPYING
24 * files - if they are missing, get the official version at www.gromacs.org.
26 * To help us fund GROMACS development, we humbly ask that you cite
27 * the papers on the package - you can find them in the top README file.
29 * For more info, check our website at http://www.gromacs.org
32 * \brief Helper functions for the selection tokenizer.
34 * This file implements the functions in the headers scanner.h and
37 * \author Teemu Murtola <teemu.murtola@cbr.su.se>
38 * \ingroup module_selection
41 * \internal \file scanner_flex.h
42 * \brief Generated (from scanner.l) header file by Flex.
44 * This file contains definitions of functions that are needed in
45 * scanner_internal.cpp.
47 * \ingroup module_selection
59 #include "gromacs/legacyheaders/typedefs.h"
60 #include "gromacs/legacyheaders/smalloc.h"
61 #include "gromacs/legacyheaders/string2.h"
63 #include "gromacs/utility/errorcodes.h"
64 #include "gromacs/utility/exceptions.h"
65 #include "gromacs/utility/gmxassert.h"
66 #include "gromacs/utility/messagestringcollector.h"
67 #include "gromacs/utility/stringutil.h"
69 #include "parsetree.h"
70 #include "selectioncollection-impl.h"
72 #include "selmethod.h"
77 #include "scanner_internal.h"
79 //! Step in which the allocated memory for pretty-printed input is incremented.
80 #define STRSTORE_ALLOCSTEP 1000
82 /* These are defined as macros in the generated scanner_flex.h.
83 * We undefine them here to have them as variable names in the subroutines.
84 * There are other ways of doing this, but this is probably the easiest. */
90 * Handles initialization of method parameter token.
93 init_param_token(YYSTYPE *yylval, gmx_ana_selparam_t *param, bool bBoolNo)
97 GMX_RELEASE_ASSERT(param->name != NULL,
98 "bBoolNo should only be set for a parameters with a name");
99 snew(yylval->str, strlen(param->name) + 3);
100 yylval->str[0] = 'n';
101 yylval->str[1] = 'o';
102 strcpy(yylval->str+2, param->name);
106 yylval->str = param->name ? strdup(param->name) : NULL;
112 * Processes a selection method token.
115 init_method_token(YYSTYPE *yylval, gmx_ana_selmethod_t *method, bool bPosMod,
116 gmx_sel_lexer_t *state)
118 /* If the previous token was not KEYWORD_POS, return EMPTY_POSMOD
119 * before the actual method to work around a limitation in Bison. */
120 if (!bPosMod && method->type != POS_VALUE)
122 state->nextmethod = method;
125 yylval->meth = method;
126 if (!(method->flags & SMETH_MODIFIER) && method->nparams == 0)
129 switch (method->type)
131 case INT_VALUE: return KEYWORD_NUMERIC;
132 case REAL_VALUE: return KEYWORD_NUMERIC;
133 case STR_VALUE: return KEYWORD_STR;
134 case GROUP_VALUE: return KEYWORD_GROUP;
136 GMX_ERROR_NORET(gmx::eeInternalError, "Unsupported keyword type");
142 /* Method with parameters or a modifier */
143 if (method->flags & SMETH_MODIFIER)
145 /* Remove all methods from the stack */
147 if (method->param[1].name == NULL)
149 state->nextparam = &method->param[1];
154 if (method->param[0].name == NULL)
156 state->nextparam = &method->param[0];
160 if (state->msp >= state->mstack_alloc)
162 state->mstack_alloc += 10;
163 srenew(state->mstack, state->mstack_alloc);
165 state->mstack[state->msp] = method;
166 if (method->flags & SMETH_MODIFIER)
170 switch (method->type)
172 case INT_VALUE: return METHOD_NUMERIC;
173 case REAL_VALUE: return METHOD_NUMERIC;
174 case POS_VALUE: return METHOD_POS;
175 case GROUP_VALUE: return METHOD_GROUP;
178 GMX_ERROR_NORET(gmx::eeInternalError, "Unsupported method type");
182 return INVALID; /* Should not be reached */
186 _gmx_sel_lexer_process_pending(YYSTYPE *yylval, gmx_sel_lexer_t *state)
188 if (state->nextparam)
190 gmx_ana_selparam_t *param = state->nextparam;
191 bool bBoolNo = state->bBoolNo;
196 return END_OF_METHOD;
198 state->nextparam = NULL;
199 state->bBoolNo = false;
200 _gmx_sel_lexer_add_token(param->name, -1, state);
201 return init_param_token(yylval, param, bBoolNo);
203 if (state->prev_pos_kw > 0)
205 --state->prev_pos_kw;
207 if (state->nextmethod)
209 gmx_ana_selmethod_t *method = state->nextmethod;
211 state->nextmethod = NULL;
212 return init_method_token(yylval, method, true, state);
218 _gmx_sel_lexer_process_identifier(YYSTYPE *yylval, char *yytext, size_t yyleng,
219 gmx_sel_lexer_t *state)
221 /* Check if the identifier matches with a parameter name */
224 gmx_ana_selparam_t *param = NULL;
225 bool bBoolNo = false;
227 while (!param && sp >= 0)
230 for (i = 0; i < state->mstack[sp]->nparams; ++i)
232 /* Skip NULL parameters and too long parameters */
233 if (state->mstack[sp]->param[i].name == NULL
234 || strlen(state->mstack[sp]->param[i].name) > yyleng)
238 if (!strncmp(state->mstack[sp]->param[i].name, yytext, yyleng))
240 param = &state->mstack[sp]->param[i];
243 /* Check separately for a 'no' prefix on boolean parameters */
244 if (state->mstack[sp]->param[i].val.type == NO_VALUE
245 && yyleng > 2 && yytext[0] == 'n' && yytext[1] == 'o'
246 && !strncmp(state->mstack[sp]->param[i].name, yytext+2, yyleng-2))
248 param = &state->mstack[sp]->param[i];
260 if (param->val.type == NO_VALUE && !bBoolNo)
262 state->bMatchBool = true;
266 state->neom = state->msp - sp - 1;
267 state->nextparam = param;
268 state->bBoolNo = bBoolNo;
269 return END_OF_METHOD;
271 _gmx_sel_lexer_add_token(param->name, -1, state);
272 return init_param_token(yylval, param, bBoolNo);
276 /* Check if the identifier matches with a symbol */
277 const gmx::SelectionParserSymbol *symbol
278 = state->sc->symtab->findSymbol(std::string(yytext, yyleng), false);
279 /* If there is no match, return the token as a string */
282 yylval->str = gmx_strndup(yytext, yyleng);
283 _gmx_sel_lexer_add_token(yytext, yyleng, state);
286 _gmx_sel_lexer_add_token(symbol->name().c_str(), -1, state);
287 gmx::SelectionParserSymbol::SymbolType symtype = symbol->type();
288 /* Reserved symbols should have been caught earlier */
289 if (symtype == gmx::SelectionParserSymbol::ReservedSymbol)
291 GMX_THROW(gmx::InternalError(gmx::formatString(
292 "Mismatch between tokenizer and reserved symbol table (for '%s')",
293 symbol->name().c_str())));
295 /* For variable symbols, return the type of the variable value */
296 if (symtype == gmx::SelectionParserSymbol::VariableSymbol)
298 gmx::SelectionTreeElementPointer var = symbol->variableValue();
299 /* Return simple tokens for constant variables */
300 if (var->type == SEL_CONST)
305 yylval->i = var->v.u.i[0];
308 yylval->r = var->v.u.r[0];
313 GMX_ERROR_NORET(gmx::eeInternalError,
314 "Unsupported variable type");
318 yylval->sel = new gmx::SelectionTreeElementPointer(var);
321 case INT_VALUE: return VARIABLE_NUMERIC;
322 case REAL_VALUE: return VARIABLE_NUMERIC;
323 case POS_VALUE: return VARIABLE_POS;
324 case GROUP_VALUE: return VARIABLE_GROUP;
327 GMX_ERROR_NORET(gmx::eeInternalError,
328 "Unsupported variable type");
332 return INVALID; /* Should not be reached. */
334 /* For method symbols, return the correct type */
335 if (symtype == gmx::SelectionParserSymbol::MethodSymbol)
337 gmx_ana_selmethod_t *method = symbol->methodValue();
338 return init_method_token(yylval, method, state->prev_pos_kw > 0, state);
340 /* For position symbols, we need to return KEYWORD_POS, but we also need
341 * some additional handling. */
342 if (symtype == gmx::SelectionParserSymbol::PositionSymbol)
344 state->bMatchOf = true;
345 yylval->str = strdup(symbol->name().c_str());
346 state->prev_pos_kw = 2;
349 /* Should not be reached */
354 _gmx_sel_lexer_add_token(const char *str, int len, gmx_sel_lexer_t *state)
356 /* Do nothing if the string is empty, or if it is a space and there is
357 * no other text yet, or if there already is a space. */
358 if (!str || len == 0 || strlen(str) == 0
359 || (str[0] == ' ' && str[1] == 0
360 && (state->pslen == 0 || state->pselstr[state->pslen - 1] == ' ')))
368 /* Allocate more memory if necessary */
369 if (state->nalloc_psel - state->pslen < len)
371 int incr = STRSTORE_ALLOCSTEP < len ? len : STRSTORE_ALLOCSTEP;
372 state->nalloc_psel += incr;
373 srenew(state->pselstr, state->nalloc_psel);
375 /* Append the token to the stored string */
376 strncpy(state->pselstr + state->pslen, str, len);
378 state->pselstr[state->pslen] = 0;
382 _gmx_sel_init_lexer(yyscan_t *scannerp, struct gmx_ana_selcollection_t *sc,
383 bool bInteractive, int maxnr, bool bGroups,
384 struct gmx_ana_indexgrps_t *grps)
386 int rc = _gmx_sel_yylex_init(scannerp);
389 // TODO: Throw a more representative exception.
390 GMX_THROW(gmx::InternalError("Lexer initialization failed"));
393 gmx_sel_lexer_t *state = new gmx_sel_lexer_t;
396 state->errors = NULL;
397 state->bGroups = bGroups;
399 state->nexpsel = (maxnr > 0 ? static_cast<int>(sc->sel.size()) + maxnr : -1);
401 state->bInteractive = bInteractive;
403 snew(state->pselstr, STRSTORE_ALLOCSTEP);
404 state->pselstr[0] = 0;
406 state->nalloc_psel = STRSTORE_ALLOCSTEP;
408 snew(state->mstack, 20);
409 state->mstack_alloc = 20;
412 state->nextparam = NULL;
413 state->nextmethod = NULL;
414 state->prev_pos_kw = 0;
415 state->bBoolNo = false;
416 state->bMatchOf = false;
417 state->bMatchBool = false;
418 state->bCmdStart = true;
419 state->bBuffer = false;
421 _gmx_sel_yyset_extra(state, *scannerp);
425 _gmx_sel_free_lexer(yyscan_t scanner)
427 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
429 sfree(state->pselstr);
430 sfree(state->mstack);
433 _gmx_sel_yy_delete_buffer(state->buffer, scanner);
436 _gmx_sel_yylex_destroy(scanner);
440 _gmx_sel_set_lexer_error_reporter(yyscan_t scanner,
441 gmx::MessageStringCollector *errors)
443 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
444 state->errors = errors;
448 _gmx_sel_lexer_set_exception(yyscan_t scanner,
449 const boost::exception_ptr &ex)
451 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
452 state->exception = ex;
456 _gmx_sel_lexer_rethrow_exception_if_occurred(yyscan_t scanner)
458 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
459 if (state->exception)
461 boost::exception_ptr ex = state->exception;
462 state->exception = boost::exception_ptr();
463 rethrow_exception(ex);
468 _gmx_sel_is_lexer_interactive(yyscan_t scanner)
470 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
471 return state->bInteractive;
474 struct gmx_ana_selcollection_t *
475 _gmx_sel_lexer_selcollection(yyscan_t scanner)
477 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
481 gmx::MessageStringCollector *
482 _gmx_sel_lexer_error_reporter(yyscan_t scanner)
484 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
485 GMX_RELEASE_ASSERT(state->errors != NULL, "Error reporter not set");
486 return state->errors;
490 _gmx_sel_lexer_has_groups_set(yyscan_t scanner)
492 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
493 return state->bGroups;
496 struct gmx_ana_indexgrps_t *
497 _gmx_sel_lexer_indexgrps(yyscan_t scanner)
499 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
504 _gmx_sel_lexer_exp_selcount(yyscan_t scanner)
506 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
507 return state->nexpsel;
511 _gmx_sel_lexer_pselstr(yyscan_t scanner)
513 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
514 return state->pselstr;
518 _gmx_sel_lexer_clear_pselstr(yyscan_t scanner)
520 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
521 state->pselstr[0] = 0;
526 _gmx_sel_lexer_clear_method_stack(yyscan_t scanner)
528 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
534 _gmx_sel_finish_method(yyscan_t scanner)
536 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
545 _gmx_sel_set_lex_input_file(yyscan_t scanner, FILE *fp)
547 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
549 state->bBuffer = true;
550 state->buffer = _gmx_sel_yy_create_buffer(fp, YY_BUF_SIZE, scanner);
551 _gmx_sel_yy_switch_to_buffer(state->buffer, scanner);
555 _gmx_sel_set_lex_input_str(yyscan_t scanner, const char *str)
557 gmx_sel_lexer_t *state = _gmx_sel_yyget_extra(scanner);
561 _gmx_sel_yy_delete_buffer(state->buffer, scanner);
563 state->bBuffer = true;
564 state->buffer = _gmx_sel_yy_scan_string(str, scanner);