masqmail-0.2

diff src/parse.c @ 0:08114f7dcc23

this is masqmail-0.2.21 from oliver kurth
author meillo@marmaro.de
date Fri, 26 Sep 2008 17:05:23 +0200
parents
children 26e34ae9a3e3
line diff
     1.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
     1.2 +++ b/src/parse.c	Fri Sep 26 17:05:23 2008 +0200
     1.3 @@ -0,0 +1,450 @@
     1.4 +/*  MasqMail
     1.5 +    Copyright (C) 1999-2001 Oliver Kurth
     1.6 +
     1.7 +    This program is free software; you can redistribute it and/or modify
     1.8 +    it under the terms of the GNU General Public License as published by
     1.9 +    the Free Software Foundation; either version 2 of the License, or
    1.10 +    (at your option) any later version.
    1.11 +
    1.12 +    This program is distributed in the hope that it will be useful,
    1.13 +    but WITHOUT ANY WARRANTY; without even the implied warranty of
    1.14 +    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    1.15 +    GNU General Public License for more details.
    1.16 +
    1.17 +    You should have received a copy of the GNU General Public License
    1.18 +    along with this program; if not, write to the Free Software
    1.19 +    Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
    1.20 +*/
    1.21 +
    1.22 +#ifndef PARSE_TEST
    1.23 +#include "masqmail.h"
    1.24 +#endif
    1.25 +
    1.26 +/* This is really dangerous. I hope that I was careful enough,
    1.27 +   but maybe there is some malformed address possible that causes
    1.28 +   this to segfault or be caught in endless loops.
    1.29 +
    1.30 +   If you find something like that, PLEASE mail the string to me
    1.31 +   (no matter how idiotic it is), so that I can debug that.
    1.32 +   Those things really should not happen.
    1.33 +*/
    1.34 +
    1.35 +static gchar *specials = "()<>@,;:\\\".[]`";
    1.36 +
    1.37 +char *parse_error = NULL;
    1.38 +
    1.39 +/* Skip the (possibly nested) comment whose opening '(' is at p.  Returns
    1.40 +   the position after the matching ')', or NULL if the comment is not
    1.41 +   closed (instead of running past the terminating NUL). */
    1.42 +static
    1.43 +gchar *skip_comment(gchar *p)
    1.44 +{
    1.45 +  gint depth = 0;
    1.46 +#ifdef PARSE_TEST
    1.47 +  g_print("skip_comment: %s\n", p);
    1.48 +#endif
    1.49 +  for(; *p; p++){
    1.50 +    if(*p == '(')
    1.51 +      depth++;
    1.52 +    else if((*p == ')') && (--depth == 0))
    1.53 +      return p + 1;
    1.54 +  }
    1.55 +  return NULL;
    1.56 +}
    1.57 +
    1.58 +/* Read one word (atom or quoted-string) at p, skipping leading white
    1.59 +   space.  Sets *b to the start of the word and *e to the character after
    1.60 +   it (*b == *e for an empty word).  Always returns TRUE. */
    1.61 +static
    1.62 +gboolean read_word(gchar *p, gchar **b, gchar **e)
    1.63 +{
    1.64 +#ifdef PARSE_TEST
    1.65 +  g_print("read_word: %s\n", p);
    1.66 +#endif
    1.67 +  /* <ctype.h> functions must be given an unsigned char value */
    1.68 +  while(isspace((unsigned char)*p)) p++;
    1.69 +  *b = p;
    1.70 +  if(*p == '\"'){
    1.71 +    /* quoted-string: step over the closing quote only if there is one,
    1.72 +       never over the terminating NUL */
    1.73 +    for(p++; *p && (*p != '\"'); p++) ;
    1.74 +    if(*p == '\"') p++;
    1.75 +  }else{ /* atom */
    1.76 +    while(*p && !strchr(specials, *p) && !iscntrl((unsigned char)*p)
    1.77 +          && !isspace((unsigned char)*p)) p++;
    1.78 +  }
    1.79 +  *e = p;
    1.80 +  return TRUE;
    1.81 +}
    1.82 +
    1.83 +/* Read a run of words joined by dots, e.g. a dotted local part.
    1.84 +   On success *b is the position this function was called with and *e
    1.85 +   the character after the last word.  Fails only if read_word() does. */
    1.86 +static
    1.87 +gboolean read_word_with_dots(gchar *p, gchar **b, gchar **e)
    1.88 +{
    1.89 +  gchar *start = p;
    1.90 +#ifdef PARSE_TEST
    1.91 +  g_print("read_word_with_dots: %s\n", p);
    1.92 +#endif
    1.93 +  for(;;){
    1.94 +    if(!read_word(p, b, e))
    1.95 +      return FALSE;
    1.96 +    if(**e != '.') break; /* *e already marks the end of the run */
    1.97 +    p = *e + 1; /* step over the dot and read the next word */
    1.98 +  }
    1.99 +  *b = start;
   1.100 +  return TRUE;
   1.101 +}
   1.102 +
   1.103 +/* Read a domain at p: a host name made of letters, digits, '-' and '.',
   1.104 +   or a bracketed literal.  Sets *b to p and *e to the character after the
   1.105 +   domain.  Returns FALSE with parse_error set if a literal lacks ']'. */
   1.106 +static
   1.107 +gboolean read_domain(gchar *p, gchar **b, gchar **e)
   1.108 +{
   1.109 +#ifdef PARSE_TEST
   1.110 +  g_print("read_domain: %s\n", p);
   1.111 +#endif
   1.112 +  *b = p;
   1.113 +  if(*p != '['){
   1.114 +    while(isalnum((unsigned char)*p) || (*p == '-') || (*p == '.')) p++;
   1.115 +  }else{ /* literal: digits are accepted so that [127.0.0.1] parses */
   1.116 +    for(p++; isalnum((unsigned char)*p) || (*p == '.'); p++) ;
   1.117 +    if(*p != ']'){
   1.118 +      parse_error =
   1.119 +        g_strdup_printf("']' expected at end of literal address %s", *b);
   1.120 +      return FALSE;
   1.121 +    }
   1.122 +    p++;
   1.123 +  }
   1.124 +  *e = p;
   1.125 +  return TRUE;
   1.126 +}
   1.127 +
   1.128 +/* Parse an RFC 822 address from string.  Accepted are a plain addr-spec
   1.129 +   ("user@domain" or an unqualified "user"), optionally enclosed in angle
   1.130 +   brackets, and the form "phrase <addr-spec>".  Comments in parentheses
   1.131 +   are skipped after each word that precedes the '@' or '<'.
   1.132 +
   1.133 +   On success TRUE is returned.  *local_begin and *local_end then delimit
   1.134 +   the local part, *domain_begin and *domain_end the domain (both NULL for
   1.135 +   an unqualified address); *address_end points behind the address and any
   1.136 +   trailing white space and '>'.  Nothing is copied, all of these point
   1.137 +   into string.
   1.138 +
   1.139 +   On failure FALSE is returned and parse_error holds an allocated message
   1.140 +   if one is available (it stays NULL e.g. for a string of blanks only).
   1.141 +   The message left by a previous call is freed on entry. */
   1.142 +gboolean parse_address_rfc822(gchar *string,
   1.143 +                       gchar **local_begin, gchar **local_end,
   1.144 +                       gchar **domain_begin, gchar **domain_end,
   1.145 +                       gchar **address_end)
   1.146 +{
   1.147 +  gint angle_brackets = 0;
   1.148 +  gchar *p = string;
   1.149 +  gchar *b, *e;
   1.150 +
   1.151 +  *local_begin = *local_end = NULL;
   1.152 +  *domain_begin = *domain_end = NULL;
   1.153 +  *address_end = NULL; /* defined on every failure path as well */
   1.154 +
   1.155 +  /* might be some memory left from previous call (g_free accepts NULL) */
   1.156 +  g_free(parse_error);
   1.157 +  parse_error = NULL;
   1.158 +
   1.159 +  /* leading spaces and angle brackets; the casts are needed because the
   1.160 +     <ctype.h> functions must be given an unsigned char value */
   1.161 +  for(; isspace((unsigned char)*p) || (*p == '<'); p++){
   1.162 +    if(*p == '<')
   1.163 +      angle_brackets++;
   1.164 +  }
   1.165 +  if(!*p)
   1.166 +    return FALSE; /* nothing but blanks and '<' */
   1.167 +
   1.168 +  while(TRUE){
   1.169 +    if(!read_word_with_dots(p, &b, &e))
   1.170 +      return FALSE;
   1.171 +    p = e;
   1.172 +#ifdef PARSE_TEST
   1.173 +    g_print("after read_word_with_dots: %s\n", p);
   1.174 +#endif
   1.175 +    /* eat white spaces and comments */
   1.176 +    while(isspace((unsigned char)*p) || (*p == '(')){
   1.177 +      if(*p != '('){
   1.178 +        p++;
   1.179 +      }else if(!(p = skip_comment(p))){
   1.180 +        parse_error = g_strdup("missing right bracket ')'");
   1.181 +        return FALSE;
   1.182 +      }
   1.183 +    }
   1.184 +    /* we now have a non-space char that is not
   1.185 +       the beginning of a comment */
   1.186 +
   1.187 +    if(*p == '@'){
   1.188 +      /* the last word was the local_part of an addr-spec */
   1.189 +      *local_begin = b;
   1.190 +      *local_end = e;
   1.191 +#ifdef PARSE_TEST
   1.192 +      g_print("found local part: %s\n", *local_begin);
   1.193 +#endif
   1.194 +      /* now the domain; the former "unqualified" else branch in here
   1.195 +         could never be reached and is gone */
   1.196 +      if(!read_domain(p + 1, &b, &e))
   1.197 +        return FALSE;
   1.198 +      p = e;
   1.199 +      *domain_begin = b;
   1.200 +      *domain_end = e;
   1.201 +      break;
   1.202 +    }
   1.203 +
   1.204 +    if(*p == '<'){
   1.205 +      /* the words read so far were a phrase, the addr-spec follows */
   1.206 +      for(; isspace((unsigned char)*p) || (*p == '<'); p++){
   1.207 +        if(*p == '<')
   1.208 +          angle_brackets++;
   1.209 +      }
   1.210 +      if(!read_word_with_dots(p, &b, &e))
   1.211 +        return FALSE;
   1.212 +      p = e;
   1.213 +      *local_begin = b;
   1.214 +      *local_end = e;
   1.215 +#ifdef PARSE_TEST
   1.216 +      g_print("found local part: %s\n", *local_begin);
   1.217 +#endif
   1.218 +      if(*p == '@'){
   1.219 +        if(!read_domain(p + 1, &b, &e))
   1.220 +          return FALSE;
   1.221 +        p = e;
   1.222 +        *domain_begin = b;
   1.223 +        *domain_end = e;
   1.224 +      }
   1.225 +      /* otherwise it may be an unqualified address:
   1.226 +         the domain pointers are still NULL */
   1.227 +      break;
   1.228 +    }
   1.229 +
   1.230 +    if(!*p || (*p == '>')){
   1.231 +      /* end of the address without any '@': unqualified local part,
   1.232 +         the domain pointers are still NULL */
   1.233 +      *local_begin = b;
   1.234 +      *local_end = e;
   1.235 +#ifdef PARSE_TEST
   1.236 +      g_print("found local part: %s\n", *local_begin);
   1.237 +#endif
   1.238 +      break;
   1.239 +    }
   1.240 +
   1.241 +    if(strchr(specials, *p) || iscntrl((unsigned char)*p)){
   1.242 +      parse_error = g_strdup_printf("unexpected character: %c", *p);
   1.243 +      return FALSE;
   1.244 +    }
   1.245 +    /* any other character starts the next word */
   1.246 +  }
   1.247 +
   1.248 +  /* trailing spaces and angle brackets */
   1.249 +#ifdef PARSE_TEST
   1.250 +  g_print("down counting trailing '>'\n");
   1.251 +#endif
   1.252 +  for(; isspace((unsigned char)*p) || (*p == '>'); p++){
   1.253 +    if(*p == '>')
   1.254 +      angle_brackets--;
   1.255 +  }
   1.256 +  *address_end = p;
   1.257 +
   1.258 +  if(angle_brackets > 0){
   1.259 +    parse_error = g_strdup("missing '>' at end of string");
   1.260 +    return FALSE;
   1.261 +  }
   1.262 +  if(angle_brackets < 0){
   1.263 +    parse_error = g_strdup("superfluous '>' at end of string");
   1.264 +    return FALSE;
   1.265 +  }
   1.266 +  return TRUE; /* we successfully parsed the address */
   1.267 +}
   1.268 +
   1.269 +/* Parse an RFC 821 style address from string: a local part, optionally
   1.270 +   followed by '@' and a domain, optionally enclosed in angle brackets.
   1.271 +   Unlike parse_address_rfc822() no phrase and no comments are accepted.
   1.272 +   On success TRUE is returned.  *local_begin and *local_end then delimit
   1.273 +   the local part, *domain_begin and *domain_end the domain (both NULL for
   1.274 +   an unqualified address); *address_end points behind the address and any
   1.275 +   trailing white space and '>'.  Nothing is copied, all of these point
   1.276 +   into string.
   1.277 +   On failure FALSE is returned and parse_error holds an allocated message
   1.278 +   if one is available (it stays NULL e.g. for a string of blanks only).
   1.279 +   The message left by a previous call is freed on entry. */
   1.280 +gboolean parse_address_rfc821(gchar *string,
   1.281 +                              gchar **local_begin, gchar **local_end,
   1.282 +                              gchar **domain_begin, gchar **domain_end,
   1.283 +                              gchar **address_end)
   1.284 +{
   1.285 +  gint angle_brackets = 0;
   1.286 +  gchar *p = string;
   1.287 +  gchar *b, *e;
   1.288 +
   1.289 +  *local_begin = *local_end = NULL;
   1.290 +  *domain_begin = *domain_end = NULL;
   1.291 +  *address_end = NULL; /* defined on every failure path as well */
   1.292 +
   1.293 +  /* might be some memory left from previous call (g_free accepts NULL) */
   1.294 +  g_free(parse_error);
   1.295 +  parse_error = NULL;
   1.296 +
   1.297 +  /* leading spaces and angle brackets (<ctype.h> wants unsigned char) */
   1.298 +  for(; isspace((unsigned char)*p) || (*p == '<'); p++){
   1.299 +    if(*p == '<')
   1.300 +      angle_brackets++;
   1.301 +  }
   1.302 +  if(!*p)
   1.303 +    return FALSE; /* nothing but blanks and '<' */
   1.304 +
   1.305 +  /* only one (dotted) word is read, the former loop never iterated */
   1.306 +  if(!read_word_with_dots(p, &b, &e))
   1.307 +    return FALSE;
   1.308 +  p = e;
   1.309 +#ifdef PARSE_TEST
   1.310 +  g_print("after read_word_with_dots: %s\n", p);
   1.311 +#endif
   1.312 +  *local_begin = b;
   1.313 +  *local_end = e;
   1.314 +#ifdef PARSE_TEST
   1.315 +  g_print("found local part: %s\n", *local_begin);
   1.316 +  g_print("local_end = %s\n", *local_end);
   1.317 +#endif
   1.318 +  if(*p == '@'){
   1.319 +    /* a broken domain is an error; formerly the result of read_domain()
   1.320 +       was dropped and TRUE could be returned with parse_error set */
   1.321 +    if(!read_domain(p + 1, &b, &e))
   1.322 +      return FALSE;
   1.323 +    p = e;
   1.324 +    *domain_begin = b;
   1.325 +    *domain_end = e;
   1.326 +  }else if(*p && !isspace((unsigned char)*p) && (*p != '>')){
   1.327 +    parse_error =
   1.328 +      g_strdup_printf("unexpected character after local part '%c'",*p);
   1.329 +    return FALSE;
   1.330 +  }
   1.331 +  /* else unqualified: the domain pointers are still NULL (the old code
   1.332 +     assigned NULL to the parameters themselves, which had no effect) */
   1.333 +
   1.334 +  /* trailing spaces and angle brackets */
   1.335 +#ifdef PARSE_TEST
   1.336 +  g_print("down counting trailing '>'\n");
   1.337 +#endif
   1.338 +  for(; isspace((unsigned char)*p) || (*p == '>'); p++){
   1.339 +    if(*p == '>')
   1.340 +      angle_brackets--;
   1.341 +  }
   1.342 +  *address_end = p;
   1.343 +
   1.344 +  if(angle_brackets > 0){
   1.345 +    parse_error = g_strdup("missing '>' at end of string");
   1.346 +    return FALSE;
   1.347 +  }
   1.348 +  if(angle_brackets < 0){
   1.349 +    parse_error = g_strdup("superfluous '>' at end of string");
   1.350 +    return FALSE;
   1.351 +  }
   1.352 +  return TRUE; /* we successfully parsed the address */
   1.353 +}
   1.354 +
   1.355 +/*
   1.356 +  Allocate an address, reading from string.
   1.357 +  On failure (string is NULL, cannot be parsed, or the local part starts
   1.358 +  with a pipe), returns NULL.  After a successful call, *end contains a
   1.359 +  pointer to the end of the parsed string, i.e. to the next ',' or to the
   1.360 +  terminating NUL.  end may be NULL, if we are not interested.
   1.361 +
   1.362 +  Parses both RFC 821 and RFC 822 addresses, depending on flag is_rfc821.
   1.363 +  The empty string yields the 'NULL' address (failure notice).
   1.364 +*/
   1.365 +address *_create_address(gchar *string, gchar **end, gboolean is_rfc821)
   1.366 +{
   1.367 +  gboolean (*parse)(gchar *, gchar **, gchar **, gchar **, gchar **, gchar **);
   1.368 +  gchar *loc_beg, *loc_end;
   1.369 +  gchar *dom_beg, *dom_end;
   1.370 +  gchar *addr_end;
   1.371 +  gchar *p;
   1.372 +  address *addr;
   1.373 +
   1.374 +  if(string == NULL)
   1.375 +    return NULL; /* used to be handed on to the parser and crash there */
   1.376 +
   1.377 +  if(string[0] == 0){
   1.378 +    addr = g_malloc(sizeof(address));
   1.379 +    /* clear all fields, not only the three that are set below */
   1.380 +    memset(addr, 0, sizeof(address));
   1.381 +    addr->address = g_strdup("");
   1.382 +    addr->local_part = g_strdup("");
   1.383 +    addr->domain = g_strdup(""); /* "" keeps it from being qualified */
   1.384 +    if(end != NULL)
   1.385 +      *end = string;
   1.386 +    return addr;
   1.387 +  }
   1.388 +
   1.389 +  parse = is_rfc821 ? parse_address_rfc821 : parse_address_rfc822;
   1.390 +  if(!parse(string, &loc_beg, &loc_end, &dom_beg, &dom_end, &addr_end))
   1.391 +    return NULL;
   1.392 +
   1.393 +  /* checked before anything is allocated; the old code returned here
   1.394 +     without freeing the address it had already allocated */
   1.395 +  if(loc_beg[0] == '|'){
   1.396 +    parse_error = g_strdup("no pipe allowed for RFC 822/821 address");
   1.397 +    return NULL;
   1.398 +  }
   1.399 +
   1.400 +  addr = g_malloc(sizeof(address));
   1.401 +  memset(addr, 0, sizeof(address));
   1.402 +
   1.403 +  /* the address text extends to the next ',' or the end of string */
   1.404 +  for(p = addr_end; *p && (*p != ','); p++) ;
   1.405 +  addr->address = g_strndup(string, p - string);
   1.406 +  addr->local_part = g_strndup(loc_beg, loc_end - loc_beg);
   1.407 +#ifdef PARSE_TEST
   1.408 +  g_print("addr->local_part = %s\n", addr->local_part);
   1.409 +#endif
   1.410 +
   1.411 +  if(dom_beg != NULL)
   1.412 +    addr->domain = g_strndup(dom_beg, dom_end - dom_beg);
   1.413 +  else if(addr->local_part[0] == 0)
   1.414 +    addr->domain = g_strdup(""); /* 'NULL' address, see above */
   1.415 +  else
   1.416 +    addr->domain = NULL;
   1.417 +
   1.418 +  if(end != NULL)
   1.419 +    *end = p;
   1.420 +#ifndef PARSE_TEST
   1.421 +  addr_unmark_delivered(addr);
   1.422 +#endif
   1.423 +  return addr;
   1.424 +}
   1.425 +
   1.426 +/* Create an address from an RFC 822 string, see _create_address(). */
   1.427 +address *create_address_rfc822(gchar *string, gchar **end)
   1.428 +{ return _create_address(string, end, FALSE); }
   1.429 +
   1.430 +/* Create an address from an RFC 821 string, see _create_address(). */
   1.431 +address *create_address_rfc821(gchar *string, gchar **end)
   1.432 +{ return _create_address(string, end, TRUE); }
   1.433 +
   1.434 +/* Parse the comma separated RFC 822 addresses in string and append them
   1.435 +   to addr_list.  An address without a domain gets a copy of domain, if
   1.436 +   that is not NULL.  Parsing stops at the first address that cannot be
   1.437 +   parsed.  Returns the resulting list. */
   1.438 +GList *addr_list_append_rfc822(GList *addr_list, gchar *string, gchar *domain)
   1.439 +{
   1.440 +  gchar *cur, *next;
   1.441 +  address *a;
   1.442 +
   1.443 +  for(cur = string; *cur; ){
   1.444 +    if((a = _create_address(cur, &next, FALSE)) == NULL)
   1.445 +      break;
   1.446 +    if((domain != NULL) && (a->domain == NULL))
   1.447 +      a->domain = g_strdup(domain);
   1.448 +    addr_list = g_list_append(addr_list, a);
   1.449 +    /* step over the separators in front of the next address */
   1.450 +    for(cur = next; (*cur == ',') || isspace(*cur); cur++) ;
   1.451 +  }
   1.452 +  return addr_list;
   1.453 +}