upstream/dynamips-0.2.8-RC1/parser.c

/*
 * Cisco 7200 (Predator) simulation platform.
 * Copyright (c) 2006 Christophe Fillot (cf@utc.fr)
 *
 * Mini-parser.
 */

#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>
#include <string.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <sys/mman.h>
#include <signal.h>
#include <fcntl.h>
#include <errno.h>
#include <assert.h>
#include <stdarg.h>
#include <sys/ioctl.h>
#include <sys/types.h>
#include <sys/socket.h>
#include <arpa/inet.h>

#include "utils.h"
#include "parser.h"

#define TOKEN_MAX_SIZE  512

/* Parser states: position of the tokenizer relative to a token */
enum {
   PARSER_STATE_BLANK,           /* between tokens (skipping blanks) */
   PARSER_STATE_STRING,          /* inside an unquoted token */
   PARSER_STATE_QUOTED_STRING,   /* inside a double-quoted token */
};

/* Character types, as classified by parser_tokenize() */
enum {
   PARSER_CHAR_BLANK,     /* space or tab */
   PARSER_CHAR_NEWLINE,   /* '\n', '\r' or the terminating NUL */
   PARSER_CHAR_COMMENT,   /* '!' or '#' */
   PARSER_CHAR_QUOTE,     /* double quote */
   PARSER_CHAR_OTHER,     /* any other character */
};

/*
 * Get a description given an error code.
 *
 * Returns a pointer to a string literal describing the PARSER_ERROR_* code
 * passed in "error"; the caller must not modify or free it. Any code that
 * is not handled below maps to "unknown error".
 */
char *parser_strerror(int error)
{
   /* Pure lookup: nothing is printed here, reporting is left to the caller */
   switch(error) {
      case PARSER_ERROR_NOMEM:
         return "insufficient memory";
      case PARSER_ERROR_UNEXP_QUOTE:
         return "unexpected quote";
      case PARSER_ERROR_UNEXP_EOL:
         return "unexpected end of line";
      default:
         return "unknown error";
   }
}

/*
 * Create a new token holding a private copy of "value" and append it to
 * the list described by *head / *last.
 *
 * Returns 0 on success, -1 if memory could not be allocated (in which case
 * the list is left untouched).
 */
static int token_create(parser_token_t **head,parser_token_t **last,
                        char *value)
{
   parser_token_t *node = malloc(sizeof(*node));

   if (node == NULL)
      return(-1);

   node->value = strdup(value);

   if (node->value == NULL) {
      free(node);
      return(-1);
   }

   node->next = NULL;

   /* Link after the current tail, or start the list if it is empty */
   if (*last != NULL)
      (*last)->next = node;
   else
      *head = node;

   *last = node;
   return(0);
}

/* Free a token list: every node and the string it owns. NULL is accepted. */
void parser_free_tokens(parser_token_t *tok_list)
{
   while (tok_list != NULL) {
      parser_token_t *cur = tok_list;

      /* Advance first: the node is gone once it has been freed */
      tok_list = cur->next;
      free(cur->value);
      free(cur);
   }
}

/*
 * Dump a token list on stdout: each value is printed between double quotes
 * and followed by a space. No trailing newline is written.
 */
void parser_dump_tokens(parser_token_t *tok_list)
{
   parser_token_t *cur = tok_list;

   while (cur != NULL) {
      printf("\"%s\" ",cur->value);
      cur = cur->next;
   }
}

/*
 * Map a token list to an array.
 *
 * Allocates an array of "tok_count" string pointers and fills it with the
 * value pointers of the first "tok_count" tokens of "tok_list". The strings
 * themselves are not copied: the entries point into the token list.
 * If the list holds fewer than "tok_count" tokens, the remaining entries
 * are NULL (the array is zero-initialized by calloc).
 *
 * Returns the array, or NULL if "tok_count" is not positive or if the
 * allocation fails.
 */
char **parser_map_array(parser_token_t *tok_list,int tok_count)
{
   char **map;
   int i;

   if (tok_count <= 0)
      return NULL;

   /* Size each slot from the array's own element type (char *) */
   if (!(map = calloc((size_t)tok_count,sizeof(*map))))
      return NULL;

   for(i=0;(i<tok_count) && tok_list;i++,tok_list=tok_list->next)
      map[i] = tok_list->value;

   return map;
}

/*
 * Add a character to a buffer.
 *
 * Stores "c" at index *pos, keeps the buffer NUL-terminated and advances
 * *pos by one. The buffer must have room for TOKEN_MAX_SIZE characters plus
 * the terminator.
 *
 * Returns 0 on success, -1 (buffer and *pos unchanged) once TOKEN_MAX_SIZE
 * characters have already been stored.
 */
static int buffer_add_char(char *buffer,int *pos,char c)
{
   int idx = *pos;

   if (idx >= TOKEN_MAX_SIZE)
      return(-1);

   buffer[idx]   = c;
   buffer[idx+1] = 0;
   *pos = idx + 1;
   return(0);
}

/* Tokenize a string */
int parser_tokenize(char *str,struct parser_token **tokens,int *tok_count)
{
   char buffer[TOKEN_MAX_SIZE+1];
   parser_token_t *tok_head,*tok_last;
   int i,buf_pos,type;
   int state,error,done;
   size_t len;
   char c;

   len        = strlen(str);
   tok_head   = tok_last = NULL;
   *tokens    = NULL;
   *tok_count = 0;
   state      = PARSER_STATE_BLANK;
   done       = FALSE;
   error      = 0;
   buf_pos    = 0;

   for(i=0;(i<len+1) && !error && !done;i++)
   {
      c = str[i];
      
      /* Determine character type */
      switch(c) {
         case '\n':
         case '\r':
         case 0:
            type = PARSER_CHAR_NEWLINE;
            break;
         case '\t':
         case ' ':
            type = PARSER_CHAR_BLANK;
            break;
         case '!':
         case '#':
            type = PARSER_CHAR_COMMENT;
            break;
         case '"':
            type = PARSER_CHAR_QUOTE;
            break;
         default:
            type = PARSER_CHAR_OTHER;
      }

      /* Basic finite state machine */
      switch(state) {
         case PARSER_STATE_BLANK:
            switch(type) {
               case PARSER_CHAR_BLANK:
                  /* Eat space */
                  break;

               case PARSER_CHAR_NEWLINE:
               case PARSER_CHAR_COMMENT:
                  done = TRUE;
                  break;

               case PARSER_CHAR_QUOTE:
                  state = PARSER_STATE_QUOTED_STRING;
                  buf_pos = 0;
                  break;
                  
               default:
                  /* Begin a new string */
                  state = PARSER_STATE_STRING;                  
                  buf_pos = 0;
                  buffer_add_char(buffer,&buf_pos,c);
            }
            break;

         case PARSER_STATE_STRING:
            switch(type) {
               case PARSER_CHAR_BLANK:
                  if (token_create(&tok_head,&tok_last,buffer) == -1)
                     error = PARSER_ERROR_NOMEM;

                  (*tok_count)++;
                  state = PARSER_STATE_BLANK;
                  break;

               case PARSER_CHAR_NEWLINE:
                  if (token_create(&tok_head,&tok_last,buffer) == -1)
                     error = PARSER_ERROR_NOMEM;

                  (*tok_count)++;
                  done = TRUE;
                  break;

               case PARSER_CHAR_COMMENT:
                  done = TRUE;
                  break;

               case PARSER_CHAR_QUOTE:
                  error = PARSER_ERROR_UNEXP_QUOTE;
                  break;

               default:
                  /* Add the character to the buffer */
                  buffer_add_char(buffer,&buf_pos,c);
            }
            break;

         case PARSER_STATE_QUOTED_STRING:
            switch(type) {
               case PARSER_CHAR_NEWLINE:
                  /* Unterminated string! */
                  error = PARSER_ERROR_UNEXP_EOL;
                  break;

               case PARSER_CHAR_QUOTE:
                  if (token_create(&tok_head,&tok_last,buffer) == -1)
                     error = PARSER_ERROR_NOMEM;

                  (*tok_count)++;
                  state = PARSER_STATE_BLANK;
                  break;

               default:
                  /* Add the character to the buffer */
                  buffer_add_char(buffer,&buf_pos,c);
            }
            break;
      }
   }

   if (error) {
      parser_free_tokens(tok_head);
      return(error);
   }

   *tokens = tok_head;
   return(0);
}

/*
 * Parser tests: input lines fed to parser_tokenize() by parser_run_tests().
 * The table is terminated by a NULL entry.
 */
static char *parser_test_str[] = {
   /* plain unquoted tokens */
   "c7200 show_hardware R1",
   /* last token quoted */
   "c7200 show_hardware \"R1\"",
   /* leading, repeated and trailing blanks */
   "   c7200    show_hardware   \"R1\"    ",
   /* every token quoted */
   "\"c7200\" \"show_hardware\" \"R1\"",
   /* quoted token containing spaces and backslashes */
   "hypervisor set_working_dir \"C:\\Program Files\\Dynamips Test\"",
   /* '#' outside quotes starts a comment: scanning stops there */
   "hypervisor # This is a comment set_working_dir \"C:\\Program Files\"",
   /* unterminated quoted string (tokenizer sets PARSER_ERROR_UNEXP_EOL) */
   "\"c7200\" \"show_hardware\" \"R1",
   /* end-of-table sentinel */
   NULL,
};

/*
 * Run the tokenizer over every entry of parser_test_str and print, for each
 * one, its index, the input line, the result code and (when a token list was
 * produced) the tokens themselves.
 */
void parser_run_tests(void)
{
   struct parser_token *tokens;
   char **test;
   int idx,status,count;

   for(test=parser_test_str,idx=0;*test != NULL;test++,idx++) {
      status = parser_tokenize(*test,&tokens,&count);

      printf("\n%d: Test string: [%s] => res=%d\n",
             idx,*test,status);

      /* Nothing to show (or free) on error or for a line without tokens */
      if (tokens == NULL)
         continue;

      printf("Tokens: ");
      parser_dump_tokens(tokens);
      printf("\n");

      parser_free_tokens(tokens);
   }
}
1	/*
2	* Cisco 7200 (Predator) simulation platform.
3	* Copyright (c) 2006 Christophe Fillot (cf@utc.fr)
4	*
5	* Mini-parser.
6	*/
7
8	#include <stdio.h>
9	#include <stdlib.h>
10	#include <unistd.h>
11	#include <string.h>
12	#include <sys/types.h>
13	#include <sys/stat.h>
14	#include <sys/mman.h>
15	#include <signal.h>
16	#include <fcntl.h>
17	#include <errno.h>
18	#include <assert.h>
19	#include <stdarg.h>
20	#include <sys/ioctl.h>
21	#include <sys/types.h>
22	#include <sys/socket.h>
23	#include <arpa/inet.h>
24
25	#include "utils.h"
26	#include "parser.h"
27
28	#define TOKEN_MAX_SIZE 512
29
30	/* Parser states */
31	enum {
32	PARSER_STATE_BLANK,
33	PARSER_STATE_STRING,
34	PARSER_STATE_QUOTED_STRING,
35	};
36
37	/* Character types */
38	enum {
39	PARSER_CHAR_BLANK,
40	PARSER_CHAR_NEWLINE,
41	PARSER_CHAR_COMMENT,
42	PARSER_CHAR_QUOTE,
43	PARSER_CHAR_OTHER,
44	};
45
46	/* Get a description given an error code */
47	char *parser_strerror(int error)
48	{
49	printf("error = %d\n",error);
50
51	switch(error) {
52	case PARSER_ERROR_NOMEM:
53	return "insufficient memory";
54	case PARSER_ERROR_UNEXP_QUOTE:
55	return "unexpected quote";
56	case PARSER_ERROR_UNEXP_EOL:
57	return "unexpected end of line";
58	default:
59	return "unknown error";
60	}
61	}
62
63	/* Create a new token */
64	static int token_create(parser_token_t head,parser_token_t last,
65	char *value)
66	{
67	parser_token_t *t;
68
69	if (!(t = malloc(sizeof(*t))))
70	return(-1);
71
72	if (!(t->value = strdup(value))) {
73	free(t);
74	return(-1);
75	}
76
77	t->next = NULL;
78
79	if (*last) {
80	(*last)->next = t;
81	*last = t;
82	} else {
83	head = last = t;
84	}
85
86	return(0);
87	}
88
89	/* Free a token list */
90	void parser_free_tokens(parser_token_t *tok_list)
91	{
92	parser_token_t t,next;
93
94	for(t=tok_list;t;t=next) {
95	next = t->next;
96	free(t->value);
97	free(t);
98	}
99	}
100
101	/* Dump a token list */
102	void parser_dump_tokens(parser_token_t *tok_list)
103	{
104	parser_token_t *t;
105
106	for(t=tok_list;t;t=t->next)
107	printf("\"%s\" ",t->value);
108	}
109
110	/* Map a token list to an array */
111	char *parser_map_array(parser_token_t tok_list,int tok_count)
112	{
113	char **map;
114	int i;
115
116	if (tok_count <= 0)
117	return NULL;
118
119	if (!(map = calloc(tok_count,sizeof(char **))))
120	return NULL;
121
122	for(i=0;(i<tok_count) && tok_list;i++,tok_list=tok_list->next)
123	map[i] = tok_list->value;
124
125	return map;
126	}
127
128	/* Add a character to a buffer */
129	static int buffer_add_char(char buffer,int pos,char c)
130	{
131	if (*pos >= TOKEN_MAX_SIZE)
132	return(-1);
133
134	buffer[(*pos)++] = c;
135	buffer[*pos] = 0;
136	return(0);
137	}
138
139	/* Tokenize a string */
140	int parser_tokenize(char str,struct parser_token tokens,int tok_count)
141	{
142	char buffer[TOKEN_MAX_SIZE+1];
143	parser_token_t tok_head,tok_last;
144	int i,buf_pos,type;
145	int state,error,done;
146	size_t len;
147	char c;
148
149	len = strlen(str);
150	tok_head = tok_last = NULL;
151	*tokens = NULL;
152	*tok_count = 0;
153	state = PARSER_STATE_BLANK;
154	done = FALSE;
155	error = 0;
156	buf_pos = 0;
157
158	for(i=0;(i<len+1) && !error && !done;i++)
159	{
160	c = str[i];
161
162	/* Determine character type */
163	switch(c) {
164	case '\n':
165	case '\r':
166	case 0:
167	type = PARSER_CHAR_NEWLINE;
168	break;
169	case '\t':
170	case ' ':
171	type = PARSER_CHAR_BLANK;
172	break;
173	case '!':
174	case '#':
175	type = PARSER_CHAR_COMMENT;
176	break;
177	case '"':
178	type = PARSER_CHAR_QUOTE;
179	break;
180	default:
181	type = PARSER_CHAR_OTHER;
182	}
183
184	/* Basic finite state machine */
185	switch(state) {
186	case PARSER_STATE_BLANK:
187	switch(type) {
188	case PARSER_CHAR_BLANK:
189	/* Eat space */
190	break;
191
192	case PARSER_CHAR_NEWLINE:
193	case PARSER_CHAR_COMMENT:
194	done = TRUE;
195	break;
196
197	case PARSER_CHAR_QUOTE:
198	state = PARSER_STATE_QUOTED_STRING;
199	buf_pos = 0;
200	break;
201
202	default:
203	/* Begin a new string */
204	state = PARSER_STATE_STRING;
205	buf_pos = 0;
206	buffer_add_char(buffer,&buf_pos,c);
207	}
208	break;
209
210	case PARSER_STATE_STRING:
211	switch(type) {
212	case PARSER_CHAR_BLANK:
213	if (token_create(&tok_head,&tok_last,buffer) == -1)
214	error = PARSER_ERROR_NOMEM;
215
216	(*tok_count)++;
217	state = PARSER_STATE_BLANK;
218	break;
219
220	case PARSER_CHAR_NEWLINE:
221	if (token_create(&tok_head,&tok_last,buffer) == -1)
222	error = PARSER_ERROR_NOMEM;
223
224	(*tok_count)++;
225	done = TRUE;
226	break;
227
228	case PARSER_CHAR_COMMENT:
229	done = TRUE;
230	break;
231
232	case PARSER_CHAR_QUOTE:
233	error = PARSER_ERROR_UNEXP_QUOTE;
234	break;
235
236	default:
237	/* Add the character to the buffer */
238	buffer_add_char(buffer,&buf_pos,c);
239	}
240	break;
241
242	case PARSER_STATE_QUOTED_STRING:
243	switch(type) {
244	case PARSER_CHAR_NEWLINE:
245	/* Unterminated string! */
246	error = PARSER_ERROR_UNEXP_EOL;
247	break;
248
249	case PARSER_CHAR_QUOTE:
250	if (token_create(&tok_head,&tok_last,buffer) == -1)
251	error = PARSER_ERROR_NOMEM;
252
253	(*tok_count)++;
254	state = PARSER_STATE_BLANK;
255	break;
256
257	default:
258	/* Add the character to the buffer */
259	buffer_add_char(buffer,&buf_pos,c);
260	}
261	break;
262	}
263	}
264
265	if (error) {
266	parser_free_tokens(tok_head);
267	return(error);
268	}
269
270	*tokens = tok_head;
271	return(0);
272	}
273
274	/* Parser tests */
275	static char *parser_test_str[] = {
276	"c7200 show_hardware R1",
277	"c7200 show_hardware \"R1\"",
278	" c7200 show_hardware \"R1\" ",
279	"\"c7200\" \"show_hardware\" \"R1\"",
280	"hypervisor set_working_dir \"C:\\Program Files\\Dynamips Test\"",
281	"hypervisor # This is a comment set_working_dir \"C:\\Program Files\"",
282	"\"c7200\" \"show_hardware\" \"R1",
283	NULL,
284	};
285
286	void parser_run_tests(void)
287	{
288	struct parser_token *tok_list;
289	int i,res,tok_count;
290
291	for(i=0;parser_test_str[i];i++) {
292	res = parser_tokenize(parser_test_str[i],&tok_list,&tok_count);
293
294	printf("\n%d: Test string: [%s] => res=%d\n",
295	i,parser_test_str[i],res);
296
297	if (tok_list) {
298	printf("Tokens: ");
299	parser_dump_tokens(tok_list);
300	printf("\n");
301
302	parser_free_tokens(tok_list);
303	}
304	}
305	}