diff options
| author | Paul Jakma <paul@quagga.net> | 2010-11-23 16:35:42 +0000 | 
|---|---|---|
| committer | Paul Jakma <paul@quagga.net> | 2011-03-21 13:51:14 +0000 | 
| commit | b881c7074bb698aeb1b099175b325734fc6e44d2 (patch) | |
| tree | 70b4816a083166bbf00c1f85f19a67df0c0a5948 /bgpd/bgp_packet.c | |
| parent | c112af27ed8f158ecece0d73ce2016c166076c00 (diff) | |
bgpd: Implement revised error handling for partial optional/trans. attributes
* BGP error handling generally boils down to "reset session". This was fine
  when all BGP speakers pretty much understood all BGP messages. However
  the increasing deployment of new attribute types has shown this approach
  to cause problems, in particular where a new attribute type is "tunneled"
  over some speakers which do not understand it, and then arrives at a speaker
  which does but considers it malformed (e.g. corruption along the way, or
  because of early implementation bugs/interop issues).
  To mitigate this drafts before the IDR (likely to be adopted) propose to
  treat errors in partial (i.e.  not understood by neighbour), optional
  transitive attributes, when received from eBGP peers, as withdrawing only
  the NLRIs in the affected UPDATE, rather than causing the entire session
  to be reset.  See:
   http://tools.ietf.org/html/draft-scudder-idr-optional-transitive
* bgp_aspath.c: (assegments_parse) Replace the "NULL means valid, 0-length
  OR an error" return value with an error code - instead taking
  pointer to result structure as arg.
  (aspath_parse) adjust to suit previous change, but here NULL really
  does mean error in the external interface.
* bgp_attr.h (bgp_attr_parse) use an explictly typed and enumerated
  value to indicate return result.
  (bgp_attr_unintern_sub) cleans up just the members of an attr, but not the
  attr itself, for benefit of those who use a stack-local attr.
* bgp_attr.c: (bgp_attr_unintern_sub) split out from bgp_attr_unintern
  (bgp_attr_unintern) as previous.
  (bgp_attr_malformed) helper function to centralise decisions on how to
  handle errors in attributes.
  (bgp_attr_{aspathlimit,origin,etc..}) Use bgp_attr_malformed.
  (bgp_attr_aspathlimit) Subcode for error specifc to this attr should be
  BGP_NOTIFY_UPDATE_OPT_ATTR_ERR.
  (bgp_attr_as4_path) be more rigorous about checks, ala bgp_attr_as_path.
  (bgp_attr_parse) Adjust to deal with the additional error level that
  bgp_attr_ parsers can raise, and also similarly return appropriate
  error back up to (bgp_update_receive). Try to avoid leaking as4_path.
* bgp_packet.c: (bgp_update_receive) Adjust to deal with BGP_ATTR_PARSE_WITHDRAW
  error level from bgp_attr_parse, which should lead to a withdraw, by
  making the attribute parameter in call to (bgp_nlri_parse) conditional
  on the error, so the update case morphs also into a withdraw.
  Use bgp_attr_unintern_sub from above, instead of doing this itself.
  Fix error case returns which were not calling bgp_attr_unintern_sub
  and probably leaking memory.
* tests/aspath_test.c: Fix to work for null return with bad segments
Diffstat (limited to 'bgpd/bgp_packet.c')
| -rw-r--r-- | bgpd/bgp_packet.c | 76 | 
1 files changed, 48 insertions, 28 deletions
| diff --git a/bgpd/bgp_packet.c b/bgpd/bgp_packet.c index dee0b51f..8de78c75 100644 --- a/bgpd/bgp_packet.c +++ b/bgpd/bgp_packet.c @@ -1589,26 +1589,47 @@ bgp_update_receive (struct peer *peer, bgp_size_t size)  		       BGP_NOTIFY_UPDATE_MAL_ATTR);        return -1;      } +   +  /* Certain attribute parsing errors should not be considered bad enough +   * to reset the session for, most particularly any partial/optional +   * attributes that have 'tunneled' over speakers that don't understand +   * them. Instead we withdraw only the prefix concerned. +   *  +   * Complicates the flow a little though.. +   */ +  bgp_attr_parse_ret_t attr_parse_ret = BGP_ATTR_PARSE_PROCEED; +  /* This define morphs the update case into a withdraw when lower levels +   * have signalled an error condition where this is best. +   */ +#define NLRI_ATTR_ARG (attr_parse_ret != BGP_ATTR_PARSE_WITHDRAW ? &attr : NULL)    /* Parse attribute when it exists. */    if (attribute_len)      { -      ret = bgp_attr_parse (peer, &attr, attribute_len,  +      attr_parse_ret = bgp_attr_parse (peer, &attr, attribute_len,   			    &mp_update, &mp_withdraw); -      if (ret < 0) +      if (attr_parse_ret == BGP_ATTR_PARSE_ERROR)  	return -1;      } - +      /* Logging the attribute. */ -  if (BGP_DEBUG (update, UPDATE_IN)) +  if (attr_parse_ret == BGP_ATTR_PARSE_WITHDRAW +      || BGP_DEBUG (update, UPDATE_IN))      {        ret= bgp_dump_attr (peer, &attr, attrstr, BUFSIZ); +      int lvl = (attr_parse_ret == BGP_ATTR_PARSE_WITHDRAW) +                 ? LOG_ERR : LOG_DEBUG; +       +      if (attr_parse_ret == BGP_ATTR_PARSE_WITHDRAW) +        zlog (peer->log, LOG_ERR, +              "%s rcvd UPDATE with errors in attr(s)!! Withdrawing route.", +              peer->host);        if (ret) -	zlog (peer->log, LOG_DEBUG, "%s rcvd UPDATE w/ attr: %s", +	zlog (peer->log, lvl, "%s rcvd UPDATE w/ attr: %s",  	      peer->host, attrstr);      } - +      /* Network Layer Reachability Information. */    update_len = end - stream_pnt (s); @@ -1617,7 +1638,12 @@ bgp_update_receive (struct peer *peer, bgp_size_t size)        /* Check NLRI packet format and prefix length. */        ret = bgp_nlri_sanity_check (peer, AFI_IP, stream_pnt (s), update_len);        if (ret < 0) -	return -1; +        { +          bgp_attr_unintern_sub (&attr); +          if (attr.extra) +            bgp_attr_extra_free (&attr); +	  return -1; +	}        /* Set NLRI portion to structure. */        update.afi = AFI_IP; @@ -1640,15 +1666,20 @@ bgp_update_receive (struct peer *peer, bgp_size_t size)  	     update. */  	  ret = bgp_attr_check (peer, &attr);  	  if (ret < 0) -	    return -1; +	    { +	      bgp_attr_unintern_sub (&attr); +              if (attr.extra) +                bgp_attr_extra_free (&attr); +	      return -1; +            } -	  bgp_nlri_parse (peer, &attr, &update); +	  bgp_nlri_parse (peer, NLRI_ATTR_ARG, &update);  	}        if (mp_update.length  	  && mp_update.afi == AFI_IP   	  && mp_update.safi == SAFI_UNICAST) -	bgp_nlri_parse (peer, &attr, &mp_update); +	bgp_nlri_parse (peer, NLRI_ATTR_ARG, &mp_update);        if (mp_withdraw.length  	  && mp_withdraw.afi == AFI_IP  @@ -1675,7 +1706,7 @@ bgp_update_receive (struct peer *peer, bgp_size_t size)        if (mp_update.length  	  && mp_update.afi == AFI_IP   	  && mp_update.safi == SAFI_MULTICAST) -	bgp_nlri_parse (peer, &attr, &mp_update); +	bgp_nlri_parse (peer, NLRI_ATTR_ARG, &mp_update);        if (mp_withdraw.length  	  && mp_withdraw.afi == AFI_IP  @@ -1705,7 +1736,7 @@ bgp_update_receive (struct peer *peer, bgp_size_t size)        if (mp_update.length   	  && mp_update.afi == AFI_IP6   	  && mp_update.safi == SAFI_UNICAST) -	bgp_nlri_parse (peer, &attr, &mp_update); +	bgp_nlri_parse (peer, NLRI_ATTR_ARG, &mp_update);        if (mp_withdraw.length   	  && mp_withdraw.afi == AFI_IP6  @@ -1734,7 +1765,7 @@ bgp_update_receive (struct peer *peer, bgp_size_t size)        if (mp_update.length   	  && mp_update.afi == AFI_IP6   	  && mp_update.safi == SAFI_MULTICAST) -	bgp_nlri_parse (peer, &attr, &mp_update); +	bgp_nlri_parse (peer, NLRI_ATTR_ARG, &mp_update);        if (mp_withdraw.length   	  && mp_withdraw.afi == AFI_IP6  @@ -1762,7 +1793,7 @@ bgp_update_receive (struct peer *peer, bgp_size_t size)        if (mp_update.length   	  && mp_update.afi == AFI_IP   	  && mp_update.safi == BGP_SAFI_VPNV4) -	bgp_nlri_parse_vpnv4 (peer, &attr, &mp_update); +	bgp_nlri_parse_vpnv4 (peer, NLRI_ATTR_ARG, &mp_update);        if (mp_withdraw.length   	  && mp_withdraw.afi == AFI_IP  @@ -1784,21 +1815,10 @@ bgp_update_receive (struct peer *peer, bgp_size_t size)    /* Everything is done.  We unintern temporary structures which       interned in bgp_attr_parse(). */ -  if (attr.aspath) -    aspath_unintern (&attr.aspath); -  if (attr.community) -    community_unintern (&attr.community); +  bgp_attr_unintern_sub (&attr);    if (attr.extra) -    { -      if (attr.extra->ecommunity) -        ecommunity_unintern (&attr.extra->ecommunity); -      if (attr.extra->cluster) -        cluster_unintern (attr.extra->cluster); -      if (attr.extra->transit) -        transit_unintern (attr.extra->transit); -      bgp_attr_extra_free (&attr); -    } - +    bgp_attr_extra_free (&attr); +      /* If peering is stopped due to some reason, do not generate BGP       event.  */    if (peer->status != Established) | 
