Annotation of embedaddon/bird/proto/bgp/attrs.c, revision 1.1

1.1     ! misho       1: /*
        !             2:  *     BIRD -- BGP Attributes
        !             3:  *
        !             4:  *     (c) 2000 Martin Mares <mj@ucw.cz>
        !             5:  *
        !             6:  *     Can be freely distributed and used under the terms of the GNU GPL.
        !             7:  */
        !             8: 
        !             9: #undef LOCAL_DEBUG
        !            10: 
        !            11: #include <stdlib.h>
        !            12: 
        !            13: #include "nest/bird.h"
        !            14: #include "nest/iface.h"
        !            15: #include "nest/protocol.h"
        !            16: #include "nest/route.h"
        !            17: #include "nest/attrs.h"
        !            18: #include "conf/conf.h"
        !            19: #include "lib/resource.h"
        !            20: #include "lib/string.h"
        !            21: #include "lib/unaligned.h"
        !            22: 
        !            23: #include "bgp.h"
        !            24: 
        !            25: /*
        !            26:  *   UPDATE message error handling
        !            27:  *
        !            28:  * All checks from RFC 4271 6.3 are done as specified with these exceptions:
        !            29:  *  - The semantic check of an IP address from NEXT_HOP attribute is missing.
        !            30:  *  - Checks of some optional attribute values are missing.
        !            31:  *  - Syntactic and semantic checks of NLRIs (done in DECODE_PREFIX())
        !            32:  *    are probably inadequate.
        !            33:  *
        !            34:  * Loop detection based on AS_PATH causes updates to be withdrawn. RFC
        !            35:  * 4271 does not explicitly specify the behavior in that case.
        !            36:  *
        !            37:  * Loop detection related to route reflection (based on ORIGINATOR_ID
        !            38:  * and CLUSTER_LIST) causes updates to be withdrawn. RFC 4456 8
        !            39:  * specifies that such updates should be ignored, but that is generally
        !            40:  * a bad idea.
        !            41:  *
        !            42:  * Error checking of optional transitive attributes is done according to
        !            43:  * draft-ietf-idr-optional-transitive-03, but errors are handled always
        !            44:  * as withdraws.
        !            45:  *
        !            46:  * Unexpected AS_CONFED_* segments in AS_PATH are logged and removed,
        !            47:  * but unknown segments cause a session drop with Malformed AS_PATH
        !            48:  * error (see validate_path()). The behavior in such case is not
        !            49:  * explicitly specified by RFC 4271. RFC 5065 specifies that
        !            50:  * inconsistent AS_CONFED_* segments should cause a session drop, but
        !            51:  * implementations that pass invalid AS_CONFED_* segments are
        !            52:  * widespread.
        !            53:  *
        !            54:  * Error handling of AS4_* attributes is done as specified by
        !            55:  * draft-ietf-idr-rfc4893bis-03. There are several possible
        !            56:  * inconsistencies between AGGREGATOR and AS4_AGGREGATOR that are not
        !            57:  * handled by that draft, these are logged and ignored (see
        !            58:  * bgp_reconstruct_4b_attrs()).
        !            59:  */
        !            60: 
        !            61: 
        !            62: static byte bgp_mandatory_attrs[] = { BA_ORIGIN, BA_AS_PATH
        !            63: #ifndef IPV6
        !            64: ,BA_NEXT_HOP
        !            65: #endif
        !            66: };
        !            67: 
/* Static description of one BGP path attribute; bgp_attr_table[] holds one per attribute code. */
struct attr_desc {
  char *name;			/* Attribute name; NULL marks a code without a table entry (see ATTR_KNOWN) */
  int expected_length;		/* Fixed payload length, or -1 when the length comes from the stored data */
  int expected_flags;		/* Flags that bgp_set_attr() copies into the eattr */
  int type;			/* eattr type (EAF_TYPE_*) that bgp_set_attr() copies into the eattr */
  int allow_in_ebgp;		/* NOTE(review): presumably whether the attribute is accepted on eBGP sessions; not used in the visible code */
  int (*validate)(struct bgp_proto *p, byte *attr, int len);	/* Optional checker; the ones in this file return 0, IGNORE, WITHDRAW or a positive code */
  void (*format)(eattr *ea, byte *buf, int buflen);		/* Optional formatter writing a textual form of the attribute into buf */
};
        !            77: 
/*
 * Special negative results of the attr_desc validate hooks. The hooks in this
 * file otherwise return 0 or a positive code.
 * NOTE(review): how the caller reacts to each value is not visible here.
 */
#define IGNORE -1
#define WITHDRAW -2
        !            80: 
        !            81: static int
        !            82: bgp_check_origin(struct bgp_proto *p UNUSED, byte *a, int len UNUSED)
        !            83: {
        !            84:   if (*a > 2)
        !            85:     return 6;
        !            86:   return 0;
        !            87: }
        !            88: 
        !            89: static void
        !            90: bgp_format_origin(eattr *a, byte *buf, int buflen UNUSED)
        !            91: {
        !            92:   static char *bgp_origin_names[] = { "IGP", "EGP", "Incomplete" };
        !            93: 
        !            94:   bsprintf(buf, bgp_origin_names[a->u.data]);
        !            95: }
        !            96: 
        !            97: static int
        !            98: path_segment_contains(byte *p, int bs, u32 asn)
        !            99: {
        !           100:   int i;
        !           101:   int len = p[1];
        !           102:   p += 2;
        !           103: 
        !           104:   for(i=0; i<len; i++)
        !           105:     {
        !           106:       u32 asn2 = (bs == 4) ? get_u32(p) : get_u16(p);
        !           107:       if (asn2 == asn)
        !           108:        return 1;
        !           109:       p += bs;
        !           110:     }
        !           111: 
        !           112:   return 0;
        !           113: }
        !           114: 
        !           115: /* Validates path attribute, removes AS_CONFED_* segments, and also returns path length */
        !           116: static int
        !           117: validate_path(struct bgp_proto *p, int as_path, int bs, byte *idata, uint *ilength)
        !           118: {
        !           119:   int res = 0;
        !           120:   u8 *a, *dst;
        !           121:   int len, plen;
        !           122: 
        !           123:   dst = a = idata;
        !           124:   len = *ilength;
        !           125: 
        !           126:   while (len)
        !           127:     {
        !           128:       if (len < 2)
        !           129:        return -1;
        !           130: 
        !           131:       plen = 2 + bs * a[1];
        !           132:       if (len < plen)
        !           133:        return -1;
        !           134: 
        !           135:       if (a[1] == 0)
        !           136:         {
        !           137:          log(L_WARN "%s: %s_PATH attribute contains empty segment, skipping it",
        !           138:              p->p.name, as_path ? "AS" : "AS4");
        !           139:          goto skip;
        !           140:        }
        !           141: 
        !           142:       switch (a[0])
        !           143:        {
        !           144:        case AS_PATH_SET:
        !           145:          res++;
        !           146:          break;
        !           147: 
        !           148:        case AS_PATH_SEQUENCE:
        !           149:          res += a[1];
        !           150:          break;
        !           151: 
        !           152:        case AS_PATH_CONFED_SEQUENCE:
        !           153:        case AS_PATH_CONFED_SET:
        !           154:          if (as_path && path_segment_contains(a, bs, p->remote_as))
        !           155:            {
        !           156:              log(L_WARN "%s: AS_CONFED_* segment with peer ASN found, misconfigured confederation?", p->p.name);
        !           157:              return -1;
        !           158:            }
        !           159: 
        !           160:          log(L_WARN "%s: %s_PATH attribute contains AS_CONFED_* segment, skipping segment",
        !           161:              p->p.name, as_path ? "AS" : "AS4");
        !           162:          goto skip;
        !           163: 
        !           164:        default:
        !           165:          return -1;
        !           166:        }
        !           167: 
        !           168:       if (dst != a)
        !           169:        memmove(dst, a, plen);
        !           170:       dst += plen;
        !           171: 
        !           172:     skip:
        !           173:       len -= plen;
        !           174:       a += plen;
        !           175:     }
        !           176: 
        !           177:   *ilength = dst - idata;
        !           178:   return res;
        !           179: }
        !           180: 
        !           181: static inline int
        !           182: validate_as_path(struct bgp_proto *p, byte *a, int *len)
        !           183: {
        !           184:   return validate_path(p, 1, p->as4_session ? 4 : 2, a, len);
        !           185: }
        !           186: 
        !           187: static inline int
        !           188: validate_as4_path(struct bgp_proto *p, struct adata *path)
        !           189: {
        !           190:   return validate_path(p, 0, 4, path->data, &path->length);
        !           191: }
        !           192: 
        !           193: static int
        !           194: bgp_check_next_hop(struct bgp_proto *p UNUSED, byte *a UNUSED6, int len UNUSED6)
        !           195: {
        !           196: #ifdef IPV6
        !           197:   return IGNORE;
        !           198: #else
        !           199:   ip_addr addr;
        !           200: 
        !           201:   memcpy(&addr, a, len);
        !           202:   ipa_ntoh(addr);
        !           203:   if (ipa_classify(addr) & IADDR_HOST)
        !           204:     return 0;
        !           205:   else
        !           206:     return 8;
        !           207: #endif
        !           208: }
        !           209: 
        !           210: static void
        !           211: bgp_format_next_hop(eattr *a, byte *buf, int buflen UNUSED)
        !           212: {
        !           213:   ip_addr *ipp = (ip_addr *) a->u.ptr->data;
        !           214: #ifdef IPV6
        !           215:   /* in IPv6, we might have two addresses in NEXT HOP */
        !           216:   if ((a->u.ptr->length == NEXT_HOP_LENGTH) && ipa_nonzero(ipp[1]))
        !           217:     {
        !           218:       bsprintf(buf, "%I %I", ipp[0], ipp[1]);
        !           219:       return;
        !           220:     }
        !           221: #endif
        !           222: 
        !           223:   bsprintf(buf, "%I", ipp[0]);
        !           224: }
        !           225: 
        !           226: static int
        !           227: bgp_check_aggregator(struct bgp_proto *p, byte *a UNUSED, int len)
        !           228: {
        !           229:   int exp_len = p->as4_session ? 8 : 6;
        !           230:   
        !           231:   return (len == exp_len) ? 0 : WITHDRAW;
        !           232: }
        !           233: 
        !           234: static void
        !           235: bgp_format_aggregator(eattr *a, byte *buf, int buflen UNUSED)
        !           236: {
        !           237:   struct adata *ad =  a->u.ptr;
        !           238:   byte *data = ad->data;
        !           239:   u32 as;
        !           240: 
        !           241:   as = get_u32(data);
        !           242:   data += 4;
        !           243: 
        !           244:   bsprintf(buf, "%d.%d.%d.%d AS%u", data[0], data[1], data[2], data[3], as);
        !           245: }
        !           246: 
        !           247: static int
        !           248: bgp_check_community(struct bgp_proto *p UNUSED, byte *a UNUSED, int len)
        !           249: {
        !           250:   return ((len % 4) == 0) ? 0 : WITHDRAW;
        !           251: }
        !           252: 
        !           253: static int
        !           254: bgp_check_cluster_list(struct bgp_proto *p UNUSED, byte *a UNUSED, int len)
        !           255: {
        !           256:   return ((len % 4) == 0) ? 0 : 5;
        !           257: }
        !           258: 
        !           259: static void
        !           260: bgp_format_cluster_list(eattr *a, byte *buf, int buflen)
        !           261: {
        !           262:   /* Truncates cluster lists larger than buflen, probably not a problem */
        !           263:   int_set_format(a->u.ptr, 0, -1, buf, buflen);
        !           264: }
        !           265: 
/*
 * Hook for MP_REACH_NLRI. With IPV6 defined it records where the attribute
 * payload starts and how long it is in the protocol instance; nothing is
 * validated here. Always returns IGNORE.
 */
static int
bgp_check_reach_nlri(struct bgp_proto *p UNUSED, byte *a UNUSED, int len UNUSED)
{
#ifdef IPV6
  p->mp_reach_start = a;
  p->mp_reach_len = len;
#endif
  return IGNORE;
}
        !           275: 
/*
 * Hook for MP_UNREACH_NLRI. With IPV6 defined it records where the attribute
 * payload starts and how long it is in the protocol instance; nothing is
 * validated here. Always returns IGNORE.
 */
static int
bgp_check_unreach_nlri(struct bgp_proto *p UNUSED, byte *a UNUSED, int len UNUSED)
{
#ifdef IPV6
  p->mp_unreach_start = a;
  p->mp_unreach_len = len;
#endif
  return IGNORE;
}
        !           285: 
        !           286: static int
        !           287: bgp_check_ext_community(struct bgp_proto *p UNUSED, byte *a UNUSED, int len)
        !           288: {
        !           289:   return ((len % 8) == 0) ? 0 : WITHDRAW;
        !           290: }
        !           291: 
        !           292: static int
        !           293: bgp_check_large_community(struct bgp_proto *p UNUSED, byte *a UNUSED, int len)
        !           294: {
        !           295:   return ((len % 12) == 0) ? 0 : WITHDRAW;
        !           296: }
        !           297: 
        !           298: 
        !           299: static struct attr_desc bgp_attr_table[] = {
        !           300:   { NULL, -1, 0, 0, 0,                                                         /* Undefined */
        !           301:     NULL, NULL },
        !           302:   { "origin", 1, BAF_TRANSITIVE, EAF_TYPE_INT, 1,                              /* BA_ORIGIN */
        !           303:     bgp_check_origin, bgp_format_origin },
        !           304:   { "as_path", -1, BAF_TRANSITIVE, EAF_TYPE_AS_PATH, 1,                                /* BA_AS_PATH */
        !           305:     NULL, NULL }, /* is checked by validate_as_path() as a special case */
        !           306:   { "next_hop", 4, BAF_TRANSITIVE, EAF_TYPE_IP_ADDRESS, 1,                     /* BA_NEXT_HOP */
        !           307:     bgp_check_next_hop, bgp_format_next_hop },
        !           308:   { "med", 4, BAF_OPTIONAL, EAF_TYPE_INT, 1,                                   /* BA_MULTI_EXIT_DISC */
        !           309:     NULL, NULL },
        !           310:   { "local_pref", 4, BAF_TRANSITIVE, EAF_TYPE_INT, 0,                          /* BA_LOCAL_PREF */
        !           311:     NULL, NULL },
        !           312:   { "atomic_aggr", 0, BAF_TRANSITIVE, EAF_TYPE_OPAQUE, 1,                      /* BA_ATOMIC_AGGR */
        !           313:     NULL, NULL },
        !           314:   { "aggregator", -1, BAF_OPTIONAL | BAF_TRANSITIVE, EAF_TYPE_OPAQUE, 1,       /* BA_AGGREGATOR */
        !           315:     bgp_check_aggregator, bgp_format_aggregator },
        !           316:   { "community", -1, BAF_OPTIONAL | BAF_TRANSITIVE, EAF_TYPE_INT_SET, 1,       /* BA_COMMUNITY */
        !           317:     bgp_check_community, NULL },
        !           318:   { "originator_id", 4, BAF_OPTIONAL, EAF_TYPE_ROUTER_ID, 0,                   /* BA_ORIGINATOR_ID */
        !           319:     NULL, NULL },
        !           320:   { "cluster_list", -1, BAF_OPTIONAL, EAF_TYPE_INT_SET, 0,                     /* BA_CLUSTER_LIST */
        !           321:     bgp_check_cluster_list, bgp_format_cluster_list }, 
        !           322:   { .name = NULL },                                                            /* BA_DPA */
        !           323:   { .name = NULL },                                                            /* BA_ADVERTISER */
        !           324:   { .name = NULL },                                                            /* BA_RCID_PATH */
        !           325:   { "mp_reach_nlri", -1, BAF_OPTIONAL, EAF_TYPE_OPAQUE, 1,                     /* BA_MP_REACH_NLRI */
        !           326:     bgp_check_reach_nlri, NULL },
        !           327:   { "mp_unreach_nlri", -1, BAF_OPTIONAL, EAF_TYPE_OPAQUE, 1,                   /* BA_MP_UNREACH_NLRI */
        !           328:     bgp_check_unreach_nlri, NULL },
        !           329:   { "ext_community", -1, BAF_OPTIONAL | BAF_TRANSITIVE, EAF_TYPE_EC_SET, 1,    /* BA_EXT_COMMUNITY */
        !           330:     bgp_check_ext_community, NULL },
        !           331:   { "as4_path", -1, BAF_OPTIONAL | BAF_TRANSITIVE, EAF_TYPE_OPAQUE, 1,         /* BA_AS4_PATH */
        !           332:     NULL, NULL },
        !           333:   { "as4_aggregator", -1, BAF_OPTIONAL | BAF_TRANSITIVE, EAF_TYPE_OPAQUE, 1,   /* BA_AS4_PATH */
        !           334:     NULL, NULL },
        !           335:   [BA_LARGE_COMMUNITY] =
        !           336:   { "large_community", -1, BAF_OPTIONAL | BAF_TRANSITIVE, EAF_TYPE_LC_SET, 1,
        !           337:     bgp_check_large_community, NULL }
        !           338: };
        !           339: 
        !           340: /* BA_AS4_PATH is type EAF_TYPE_OPAQUE and not type EAF_TYPE_AS_PATH.
        !           341:  * It does not matter as this attribute does not appear on routes in the routing table.
        !           342:  */
        !           343: 
/*
 * True when code is a valid index into bgp_attr_table[] and the entry there
 * has a non-NULL name. The argument is evaluated twice, so it must not have
 * side effects.
 */
#define ATTR_KNOWN(code) ((code) < ARRAY_SIZE(bgp_attr_table) && bgp_attr_table[code].name)
        !           345: 
        !           346: static inline struct adata *
        !           347: bgp_alloc_adata(struct linpool *pool, unsigned len)
        !           348: {
        !           349:   struct adata *ad = lp_alloc(pool, sizeof(struct adata) + len);
        !           350:   ad->length = len;
        !           351:   return ad;
        !           352: }
        !           353: 
        !           354: static void
        !           355: bgp_set_attr(eattr *e, unsigned attr, uintptr_t val)
        !           356: {
        !           357:   ASSERT(ATTR_KNOWN(attr));
        !           358:   e->id = EA_CODE(EAP_BGP, attr);
        !           359:   e->type = bgp_attr_table[attr].type;
        !           360:   e->flags = bgp_attr_table[attr].expected_flags;
        !           361:   if (e->type & EAF_EMBEDDED)
        !           362:     e->u.data = val;
        !           363:   else
        !           364:     e->u.ptr = (struct adata *) val;
        !           365: }
        !           366: 
        !           367: static byte *
        !           368: bgp_set_attr_wa(eattr *e, struct linpool *pool, unsigned attr, unsigned len)
        !           369: {
        !           370:   struct adata *ad = bgp_alloc_adata(pool, len);
        !           371:   bgp_set_attr(e, attr, (uintptr_t) ad);
        !           372:   return ad->data;
        !           373: }
        !           374: 
        !           375: void
        !           376: bgp_attach_attr(ea_list **to, struct linpool *pool, unsigned attr, uintptr_t val)
        !           377: {
        !           378:   ea_list *a = lp_alloc(pool, sizeof(ea_list) + sizeof(eattr));
        !           379:   a->next = *to;
        !           380:   *to = a;
        !           381:   a->flags = EALF_SORTED;
        !           382:   a->count = 1;
        !           383:   bgp_set_attr(a->attrs, attr, val);
        !           384: }
        !           385: 
        !           386: byte *
        !           387: bgp_attach_attr_wa(ea_list **to, struct linpool *pool, unsigned attr, unsigned len)
        !           388: {
        !           389:   struct adata *ad = bgp_alloc_adata(pool, len);
        !           390:   bgp_attach_attr(to, pool, attr, (uintptr_t) ad);
        !           391:   return ad->data;
        !           392: }
        !           393: 
        !           394: static int
        !           395: bgp_encode_attr_hdr(byte *dst, uint flags, unsigned code, int len)
        !           396: {
        !           397:   int wlen;
        !           398: 
        !           399:   DBG("\tAttribute %02x (%d bytes, flags %02x)\n", code, len, flags);
        !           400: 
        !           401:   if (len < 256)
        !           402:     {
        !           403:       *dst++ = flags;
        !           404:       *dst++ = code;
        !           405:       *dst++ = len;
        !           406:       wlen = 3;
        !           407:     }
        !           408:   else
        !           409:     {
        !           410:       *dst++ = flags | BAF_EXT_LEN;
        !           411:       *dst++ = code;
        !           412:       put_u16(dst, len);
        !           413:       wlen = 4;
        !           414:     }
        !           415: 
        !           416:   return wlen;
        !           417: }
        !           418: 
        !           419: static void
        !           420: aggregator_convert_to_old(struct adata *aggr, byte *dst, int *new_used)
        !           421: {
        !           422:   byte *src = aggr->data;
        !           423:   *new_used = 0;
        !           424: 
        !           425:   u32 as = get_u32(src);
        !           426:   if (as > 0xFFFF) 
        !           427:     {
        !           428:       as = AS_TRANS;
        !           429:       *new_used = 1;
        !           430:     }
        !           431:   put_u16(dst, as);
        !           432: 
        !           433:   /* Copy IPv4 address */
        !           434:   memcpy(dst + 2, src + 4, 4);
        !           435: }
        !           436: 
        !           437: static void
        !           438: aggregator_convert_to_new(struct adata *aggr, byte *dst)
        !           439: {
        !           440:   byte *src = aggr->data;
        !           441: 
        !           442:   u32 as   = get_u16(src);
        !           443:   put_u32(dst, as);
        !           444: 
        !           445:   /* Copy IPv4 address */
        !           446:   memcpy(dst + 4, src + 2, 4);
        !           447: }
        !           448: 
        !           449: static int
        !           450: bgp_get_attr_len(eattr *a)
        !           451: {
        !           452:   int len;
        !           453:   if (ATTR_KNOWN(EA_ID(a->id)))
        !           454:     {
        !           455:       int code = EA_ID(a->id);
        !           456:       struct attr_desc *desc = &bgp_attr_table[code];
        !           457:       len = desc->expected_length;
        !           458:       if (len < 0)
        !           459:        {
        !           460:          ASSERT(!(a->type & EAF_EMBEDDED));
        !           461:          len = a->u.ptr->length;
        !           462:        }
        !           463:     }
        !           464:   else
        !           465:     {
        !           466:       ASSERT((a->type & EAF_TYPE_MASK) == EAF_TYPE_OPAQUE);
        !           467:       len = a->u.ptr->length;
        !           468:     }
        !           469:   
        !           470:   return len;
        !           471: }
        !           472: 
        !           473: #define ADVANCE(w, r, l) do { r -= l; w += l; } while (0)
        !           474: 
        !           475: /**
        !           476:  * bgp_encode_attrs - encode BGP attributes
        !           477:  * @p: BGP instance
        !           478:  * @w: buffer
        !           479:  * @attrs: a list of extended attributes
        !           480:  * @remains: remaining space in the buffer
        !           481:  *
        !           482:  * The bgp_encode_attrs() function takes a list of extended attributes
        !           483:  * and converts it to its BGP representation (a part of an Update message).
        !           484:  *
        !           485:  * Result: Length of the attribute block generated or -1 if not enough space.
        !           486:  */
        !           487: uint
        !           488: bgp_encode_attrs(struct bgp_proto *p, byte *w, ea_list *attrs, int remains)
        !           489: {
        !           490:   uint i, code, type, flags;
        !           491:   byte *start = w;
        !           492:   int len, rv;
        !           493: 
        !           494:   for(i=0; i<attrs->count; i++)
        !           495:     {
        !           496:       eattr *a = &attrs->attrs[i];
        !           497:       ASSERT(EA_PROTO(a->id) == EAP_BGP);
        !           498:       code = EA_ID(a->id);
        !           499: 
        !           500: #ifdef IPV6
        !           501:       /* When talking multiprotocol BGP, the NEXT_HOP attributes are used only temporarily. */
        !           502:       if (code == BA_NEXT_HOP)
        !           503:        continue;
        !           504: #endif
        !           505: 
        !           506:       /* When AS4-aware BGP speaker is talking to non-AS4-aware BGP speaker,
        !           507:        * we have to convert our 4B AS_PATH to 2B AS_PATH and send our AS_PATH 
        !           508:        * as optional AS4_PATH attribute.
        !           509:        */
        !           510:       if ((code == BA_AS_PATH) && (! p->as4_session))
        !           511:        {
        !           512:          len = a->u.ptr->length;
        !           513: 
        !           514:          if (remains < (len + 4))
        !           515:            goto err_no_buffer;
        !           516: 
        !           517:          /* Using temporary buffer because don't know a length of created attr
        !           518:           * and therefore a length of a header. Perhaps i should better always
        !           519:           * use BAF_EXT_LEN. */
        !           520:          
        !           521:          byte buf[len];
        !           522:          int new_used;
        !           523:          int nl = as_path_convert_to_old(a->u.ptr, buf, &new_used);
        !           524: 
        !           525:          DBG("BGP: Encoding old AS_PATH\n");
        !           526:          rv = bgp_encode_attr_hdr(w, BAF_TRANSITIVE, BA_AS_PATH, nl);
        !           527:          ADVANCE(w, remains, rv);
        !           528:          memcpy(w, buf, nl);
        !           529:          ADVANCE(w, remains, nl);
        !           530: 
        !           531:          if (! new_used)
        !           532:            continue;
        !           533: 
        !           534:          if (remains < (len + 4))
        !           535:            goto err_no_buffer;
        !           536: 
        !           537:          /* We should discard AS_CONFED_SEQUENCE or AS_CONFED_SET path segments 
        !           538:           * here but we don't support confederations and such paths we already
        !           539:           * discarded in bgp_check_as_path().
        !           540:           */
        !           541: 
        !           542:          DBG("BGP: Encoding AS4_PATH\n");
        !           543:          rv = bgp_encode_attr_hdr(w, BAF_OPTIONAL | BAF_TRANSITIVE, BA_AS4_PATH, len);
        !           544:          ADVANCE(w, remains, rv);
        !           545:          memcpy(w, a->u.ptr->data, len);
        !           546:          ADVANCE(w, remains, len);
        !           547: 
        !           548:          continue;
        !           549:        }
        !           550: 
        !           551:       /* The same issue with AGGREGATOR attribute */
        !           552:       if ((code == BA_AGGREGATOR) && (! p->as4_session))
        !           553:        {
        !           554:          int new_used;
        !           555: 
        !           556:          len = 6;
        !           557:          if (remains < (len + 3))
        !           558:            goto err_no_buffer;
        !           559: 
        !           560:          rv = bgp_encode_attr_hdr(w, BAF_OPTIONAL | BAF_TRANSITIVE, BA_AGGREGATOR, len);
        !           561:          ADVANCE(w, remains, rv);
        !           562:          aggregator_convert_to_old(a->u.ptr, w, &new_used);
        !           563:          ADVANCE(w, remains, len);
        !           564: 
        !           565:          if (! new_used)
        !           566:            continue;
        !           567: 
        !           568:          len = 8;
        !           569:          if (remains < (len + 3))
        !           570:            goto err_no_buffer;
        !           571: 
        !           572:          rv = bgp_encode_attr_hdr(w, BAF_OPTIONAL | BAF_TRANSITIVE, BA_AS4_AGGREGATOR, len);
        !           573:          ADVANCE(w, remains, rv);
        !           574:          memcpy(w, a->u.ptr->data, len);
        !           575:          ADVANCE(w, remains, len);
        !           576: 
        !           577:          continue;
        !           578:        }
        !           579: 
        !           580:       /* Standard path continues here ... */
        !           581: 
        !           582:       type = a->type & EAF_TYPE_MASK;
        !           583:       flags = a->flags & (BAF_OPTIONAL | BAF_TRANSITIVE | BAF_PARTIAL);
        !           584:       len = bgp_get_attr_len(a);
        !           585: 
        !           586:       /* Skip empty sets */ 
        !           587:       if (((type == EAF_TYPE_INT_SET) || (type == EAF_TYPE_EC_SET) || (type == EAF_TYPE_LC_SET)) && (len == 0))
        !           588:        continue; 
        !           589: 
        !           590:       if (remains < len + 4)
        !           591:        goto err_no_buffer;
        !           592: 
        !           593:       rv = bgp_encode_attr_hdr(w, flags, code, len);
        !           594:       ADVANCE(w, remains, rv);
        !           595: 
        !           596:       switch (type)
        !           597:        {
        !           598:        case EAF_TYPE_INT:
        !           599:        case EAF_TYPE_ROUTER_ID:
        !           600:          if (len == 4)
        !           601:            put_u32(w, a->u.data);
        !           602:          else
        !           603:            *w = a->u.data;
        !           604:          break;
        !           605:        case EAF_TYPE_IP_ADDRESS:
        !           606:          {
        !           607:            ip_addr ip = *(ip_addr *)a->u.ptr->data;
        !           608:            ipa_hton(ip);
        !           609:            memcpy(w, &ip, len);
        !           610:            break;
        !           611:          }
        !           612:        case EAF_TYPE_INT_SET:
        !           613:        case EAF_TYPE_LC_SET:
        !           614:        case EAF_TYPE_EC_SET:
        !           615:          {
        !           616:            u32 *z = int_set_get_data(a->u.ptr);
        !           617:            int i;
        !           618:            for(i=0; i<len; i+=4)
        !           619:              put_u32(w+i, *z++);
        !           620:            break;
        !           621:          }
        !           622:        case EAF_TYPE_OPAQUE:
        !           623:        case EAF_TYPE_AS_PATH:
        !           624:          memcpy(w, a->u.ptr->data, len);
        !           625:          break;
        !           626:        default:
        !           627:          bug("bgp_encode_attrs: unknown attribute type %02x", a->type);
        !           628:        }
        !           629:       ADVANCE(w, remains, len);
        !           630:     }
        !           631:   return w - start;
        !           632: 
        !           633:  err_no_buffer:
        !           634:   return -1;
        !           635: }
        !           636: 
        !           637: /*
        !           638: static void
        !           639: bgp_init_prefix(struct fib_node *N)
        !           640: {
        !           641:   struct bgp_prefix *p = (struct bgp_prefix *) N;
        !           642:   p->bucket_node.next = NULL;
        !           643: }
        !           644: */
        !           645: 
        !           646: static int
        !           647: bgp_compare_u32(const u32 *x, const u32 *y)
        !           648: {
        !           649:   return (*x < *y) ? -1 : (*x > *y) ? 1 : 0;
        !           650: }
        !           651: 
        !           652: static inline void
        !           653: bgp_normalize_int_set(u32 *dest, u32 *src, unsigned cnt)
        !           654: {
        !           655:   memcpy(dest, src, sizeof(u32) * cnt);
        !           656:   qsort(dest, cnt, sizeof(u32), (int(*)(const void *, const void *)) bgp_compare_u32);
        !           657: }
        !           658: 
        !           659: static int
        !           660: bgp_compare_ec(const u32 *xp, const u32 *yp)
        !           661: {
        !           662:   u64 x = ec_get(xp, 0);
        !           663:   u64 y = ec_get(yp, 0);
        !           664:   return (x < y) ? -1 : (x > y) ? 1 : 0;
        !           665: }
        !           666: 
        !           667: static inline void
        !           668: bgp_normalize_ec_set(struct adata *ad, u32 *src, int internal)
        !           669: {
        !           670:   u32 *dst = int_set_get_data(ad);
        !           671: 
        !           672:   /* Remove non-transitive communities (EC_TBIT active) on external sessions */
        !           673:   if (! internal)
        !           674:     {
        !           675:       int len = int_set_get_size(ad);
        !           676:       u32 *t = dst;
        !           677:       int i;
        !           678: 
        !           679:       for (i=0; i < len; i += 2)
        !           680:        {
        !           681:          if (src[i] & EC_TBIT)
        !           682:            continue;
        !           683:          
        !           684:          *t++ = src[i];
        !           685:          *t++ = src[i+1];
        !           686:        }
        !           687: 
        !           688:       ad->length = (t - dst) * 4;
        !           689:     }
        !           690:   else
        !           691:     memcpy(dst, src, ad->length);
        !           692: 
        !           693:   qsort(dst, ad->length / 8, 8, (int(*)(const void *, const void *)) bgp_compare_ec);
        !           694: }
        !           695: 
        !           696: static int
        !           697: bgp_compare_lc(const u32 *x, const u32 *y)
        !           698: {
        !           699:   if (x[0] != y[0])
        !           700:     return (x[0] > y[0]) ? 1 : -1;
        !           701:   if (x[1] != y[1])
        !           702:     return (x[1] > y[1]) ? 1 : -1;
        !           703:   if (x[2] != y[2])
        !           704:     return (x[2] > y[2]) ? 1 : -1;
        !           705:   return 0;
        !           706: }
        !           707: 
        !           708: static inline void
        !           709: bgp_normalize_lc_set(u32 *dest, u32 *src, unsigned cnt)
        !           710: {
        !           711:   memcpy(dest, src, LCOMM_LENGTH * cnt);
        !           712:   qsort(dest, cnt, LCOMM_LENGTH, (int(*)(const void *, const void *)) bgp_compare_lc);
        !           713: }
        !           714: 
        !           715: static void
        !           716: bgp_rehash_buckets(struct bgp_proto *p)
        !           717: {
        !           718:   struct bgp_bucket **old = p->bucket_hash;
        !           719:   struct bgp_bucket **new;
        !           720:   unsigned oldn = p->hash_size;
        !           721:   unsigned i, e, mask;
        !           722:   struct bgp_bucket *b;
        !           723: 
        !           724:   p->hash_size = p->hash_limit;
        !           725:   DBG("BGP: Rehashing bucket table from %d to %d\n", oldn, p->hash_size);
        !           726:   p->hash_limit *= 4;
        !           727:   if (p->hash_limit >= 65536)
        !           728:     p->hash_limit = ~0;
        !           729:   new = p->bucket_hash = mb_allocz(p->p.pool, p->hash_size * sizeof(struct bgp_bucket *));
        !           730:   mask = p->hash_size - 1;
        !           731:   for (i=0; i<oldn; i++)
        !           732:     while (b = old[i])
        !           733:       {
        !           734:        old[i] = b->hash_next;
        !           735:        e = b->hash & mask;
        !           736:        b->hash_next = new[e];
        !           737:        if (b->hash_next)
        !           738:          b->hash_next->hash_prev = b;
        !           739:        b->hash_prev = NULL;
        !           740:        new[e] = b;
        !           741:       }
        !           742:   mb_free(old);
        !           743: }
        !           744: 
        !           745: static struct bgp_bucket *
        !           746: bgp_new_bucket(struct bgp_proto *p, ea_list *new, unsigned hash)
        !           747: {
        !           748:   struct bgp_bucket *b;
        !           749:   unsigned ea_size = sizeof(ea_list) + new->count * sizeof(eattr);
        !           750:   unsigned ea_size_aligned = BIRD_ALIGN(ea_size, CPU_STRUCT_ALIGN);
        !           751:   unsigned size = sizeof(struct bgp_bucket) + ea_size_aligned;
        !           752:   unsigned i;
        !           753:   byte *dest;
        !           754:   unsigned index = hash & (p->hash_size - 1);
        !           755: 
        !           756:   /* Gather total size of non-inline attributes */
        !           757:   for (i=0; i<new->count; i++)
        !           758:     {
        !           759:       eattr *a = &new->attrs[i];
        !           760:       if (!(a->type & EAF_EMBEDDED))
        !           761:        size += BIRD_ALIGN(sizeof(struct adata) + a->u.ptr->length, CPU_STRUCT_ALIGN);
        !           762:     }
        !           763: 
        !           764:   /* Create the bucket and hash it */
        !           765:   b = mb_alloc(p->p.pool, size);
        !           766:   b->hash_next = p->bucket_hash[index];
        !           767:   if (b->hash_next)
        !           768:     b->hash_next->hash_prev = b;
        !           769:   p->bucket_hash[index] = b;
        !           770:   b->hash_prev = NULL;
        !           771:   b->hash = hash;
        !           772:   add_tail(&p->bucket_queue, &b->send_node);
        !           773:   init_list(&b->prefixes);
        !           774:   memcpy(b->eattrs, new, ea_size);
        !           775:   dest = ((byte *)b->eattrs) + ea_size_aligned;
        !           776: 
        !           777:   /* Copy values of non-inline attributes */
        !           778:   for (i=0; i<new->count; i++)
        !           779:     {
        !           780:       eattr *a = &b->eattrs->attrs[i];
        !           781:       if (!(a->type & EAF_EMBEDDED))
        !           782:        {
        !           783:          struct adata *oa = a->u.ptr;
        !           784:          struct adata *na = (struct adata *) dest;
        !           785:          memcpy(na, oa, sizeof(struct adata) + oa->length);
        !           786:          a->u.ptr = na;
        !           787:          dest += BIRD_ALIGN(sizeof(struct adata) + na->length, CPU_STRUCT_ALIGN);
        !           788:        }
        !           789:     }
        !           790: 
        !           791:   /* If needed, rehash */
        !           792:   p->hash_count++;
        !           793:   if (p->hash_count > p->hash_limit)
        !           794:     bgp_rehash_buckets(p);
        !           795: 
        !           796:   return b;
        !           797: }
        !           798: 
        !           799: static struct bgp_bucket *
        !           800: bgp_get_bucket(struct bgp_proto *p, net *n, ea_list *attrs, int originate)
        !           801: {
        !           802:   ea_list *new;
        !           803:   unsigned i, cnt, hash, code;
        !           804:   eattr *a, *d;
        !           805:   u32 seen = 0;
        !           806:   struct bgp_bucket *b;
        !           807: 
        !           808:   /* Merge the attribute list */
        !           809:   new = alloca(ea_scan(attrs));
        !           810:   ea_merge(attrs, new);
        !           811:   ea_sort(new);
        !           812: 
        !           813:   /* Normalize attributes */
        !           814:   d = new->attrs;
        !           815:   cnt = new->count;
        !           816:   new->count = 0;
        !           817:   for(i=0; i<cnt; i++)
        !           818:     {
        !           819:       a = &new->attrs[i];
        !           820:       if (EA_PROTO(a->id) != EAP_BGP)
        !           821:        continue;
        !           822:       code = EA_ID(a->id);
        !           823:       if (ATTR_KNOWN(code))
        !           824:        {
        !           825:          if (!bgp_attr_table[code].allow_in_ebgp && !p->is_internal)
        !           826:            continue;
        !           827:          /* The flags might have been zero if the attr was added by filters */
        !           828:          a->flags = (a->flags & BAF_PARTIAL) | bgp_attr_table[code].expected_flags;
        !           829:          if (code < 32)
        !           830:            seen |= 1 << code;
        !           831:        }
        !           832:       else
        !           833:        {
        !           834:          /* Don't re-export unknown non-transitive attributes */
        !           835:          if (!(a->flags & BAF_TRANSITIVE))
        !           836:            continue;
        !           837:        }
        !           838:       *d = *a;
        !           839:       if ((d->type & EAF_ORIGINATED) && !originate && (d->flags & BAF_TRANSITIVE) && (d->flags & BAF_OPTIONAL))
        !           840:        d->flags |= BAF_PARTIAL;
        !           841:       switch (d->type & EAF_TYPE_MASK)
        !           842:        {
        !           843:        case EAF_TYPE_INT_SET:
        !           844:          {
        !           845:            struct adata *z = alloca(sizeof(struct adata) + d->u.ptr->length);
        !           846:            z->length = d->u.ptr->length;
        !           847:            bgp_normalize_int_set((u32 *) z->data, (u32 *) d->u.ptr->data, z->length / 4);
        !           848:            d->u.ptr = z;
        !           849:            break;
        !           850:          }
        !           851:        case EAF_TYPE_EC_SET:
        !           852:          {
        !           853:            struct adata *z = alloca(sizeof(struct adata) + d->u.ptr->length);
        !           854:            z->length = d->u.ptr->length;
        !           855:            bgp_normalize_ec_set(z, (u32 *) d->u.ptr->data, p->is_internal);
        !           856:            d->u.ptr = z;
        !           857:            break;
        !           858:          }
        !           859:        case EAF_TYPE_LC_SET:
        !           860:          {
        !           861:            struct adata *z = alloca(sizeof(struct adata) + d->u.ptr->length);
        !           862:            z->length = d->u.ptr->length;
        !           863:            bgp_normalize_lc_set((u32 *) z->data, (u32 *) d->u.ptr->data, z->length / LCOMM_LENGTH);
        !           864:            d->u.ptr = z;
        !           865:            break;
        !           866:          }
        !           867:        default: ;
        !           868:        }
        !           869:       d++;
        !           870:       new->count++;
        !           871:     }
        !           872: 
        !           873:   /* Hash */
        !           874:   hash = ea_hash(new);
        !           875:   for(b=p->bucket_hash[hash & (p->hash_size - 1)]; b; b=b->hash_next)
        !           876:     if (b->hash == hash && ea_same(b->eattrs, new))
        !           877:       {
        !           878:        DBG("Found bucket.\n");
        !           879:        return b;
        !           880:       }
        !           881: 
        !           882:   /* Ensure that there are all mandatory attributes */
        !           883:   for(i=0; i<ARRAY_SIZE(bgp_mandatory_attrs); i++)
        !           884:     if (!(seen & (1 << bgp_mandatory_attrs[i])))
        !           885:       {
        !           886:        log(L_ERR "%s: Mandatory attribute %s missing in route %I/%d", p->p.name, bgp_attr_table[bgp_mandatory_attrs[i]].name, n->n.prefix, n->n.pxlen);
        !           887:        return NULL;
        !           888:       }
        !           889: 
        !           890:   /* Check if next hop is valid */
        !           891:   a = ea_find(new, EA_CODE(EAP_BGP, BA_NEXT_HOP));
        !           892:   if (!a || ipa_equal(p->cf->remote_ip, *(ip_addr *)a->u.ptr->data))
        !           893:     {
        !           894:       log(L_ERR "%s: Invalid NEXT_HOP attribute in route %I/%d", p->p.name, n->n.prefix, n->n.pxlen);
        !           895:       return NULL;
        !           896:     }
        !           897: 
        !           898:   /* Create new bucket */
        !           899:   DBG("Creating bucket.\n");
        !           900:   return bgp_new_bucket(p, new, hash);
        !           901: }
        !           902: 
        !           903: void
        !           904: bgp_free_bucket(struct bgp_proto *p, struct bgp_bucket *buck)
        !           905: {
        !           906:   if (buck->hash_next)
        !           907:     buck->hash_next->hash_prev = buck->hash_prev;
        !           908:   if (buck->hash_prev)
        !           909:     buck->hash_prev->hash_next = buck->hash_next;
        !           910:   else
        !           911:     p->bucket_hash[buck->hash & (p->hash_size-1)] = buck->hash_next;
        !           912:   mb_free(buck);
        !           913: }
        !           914: 
        !           915: 
        !           916: /* Prefix hash table */
        !           917: 
/*
 * Definitions for the PXH (prefix) hash, consumed by the HASH_*() macros
 * used below with the PXH identifier.
 *
 * A struct bgp_prefix is keyed by the triple (prefix, pxlen, path_id).
 */

/* Key triple of node n1 */
#define PXH_KEY(n1)            n1->n.prefix, n1->n.pxlen, n1->path_id
/* Link to the next node in a hash chain */
#define PXH_NEXT(n)            n->next
/* Two keys are equal when all three components match */
#define PXH_EQ(p1,l1,i1,p2,l2,i2) ipa_equal(p1, p2) && l1 == l2 && i1 == i2
/* Hash of a key: address hash mixed with a hash of prefix length and path ID */
#define PXH_FN(p,l,i)          ipa_hash32(p) ^ u32_hash((l << 16) ^ i)

/* Name of the rehash function generated by HASH_DEFINE_REHASH_FN() below */
#define PXH_REHASH             bgp_pxh_rehash
/* Resizing parameters for the hash macros -- NOTE(review): exact meaning
   of the individual fields is defined by the hash implementation, confirm there */
#define PXH_PARAMS             /8, *2, 2, 2, 8, 20


HASH_DEFINE_REHASH_FN(PXH, struct bgp_prefix)
        !           928: 
/*
 * Set up prefix bookkeeping of @p: initialize p->prefix_hash with the
 * given @order and create the slab p->prefix_slab for struct bgp_prefix
 * nodes. Both are allocated from the protocol pool p->p.pool.
 */
void
bgp_init_prefix_table(struct bgp_proto *p, u32 order)
{
  HASH_INIT(p->prefix_hash, p->p.pool, order);

  p->prefix_slab = sl_new(p->p.pool, sizeof(struct bgp_prefix));
}
        !           936: 
/*
 * Counterpart of bgp_init_prefix_table(): release the prefix hash and
 * the prefix slab of @p. The slab pointer is cleared afterwards.
 */
void
bgp_free_prefix_table(struct bgp_proto *p)
{
  HASH_FREE(p->prefix_hash);

  rfree(p->prefix_slab);
  p->prefix_slab = NULL;
}
        !           945: 
        !           946: static struct bgp_prefix *
        !           947: bgp_get_prefix(struct bgp_proto *p, ip_addr prefix, int pxlen, u32 path_id)
        !           948: {
        !           949:   struct bgp_prefix *bp = HASH_FIND(p->prefix_hash, PXH, prefix, pxlen, path_id);
        !           950: 
        !           951:   if (bp)
        !           952:     return bp;
        !           953: 
        !           954:   bp = sl_alloc(p->prefix_slab);
        !           955:   bp->n.prefix = prefix;
        !           956:   bp->n.pxlen = pxlen;
        !           957:   bp->path_id = path_id;
        !           958:   bp->bucket_node.next = NULL;
        !           959: 
        !           960:   HASH_INSERT2(p->prefix_hash, PXH, p->p.pool, bp);
        !           961: 
        !           962:   return bp;
        !           963: }
        !           964: 
/*
 * Remove the prefix node @bp from the prefix hash of @p and return its
 * memory to the prefix slab.
 */
void
bgp_free_prefix(struct bgp_proto *p, struct bgp_prefix *bp)
{
  HASH_REMOVE2(p->prefix_hash, PXH, p->p.pool, bp);
  sl_free(p->prefix_slab, bp);
}
        !           971: 
        !           972: 
        !           973: void
        !           974: bgp_rt_notify(struct proto *P, rtable *tbl UNUSED, net *n, rte *new, rte *old UNUSED, ea_list *attrs)
        !           975: {
        !           976:   struct bgp_proto *p = (struct bgp_proto *) P;
        !           977:   struct bgp_bucket *buck;
        !           978:   struct bgp_prefix *px;
        !           979:   rte *key;
        !           980:   u32 path_id;
        !           981: 
        !           982:   DBG("BGP: Got route %I/%d %s\n", n->n.prefix, n->n.pxlen, new ? "up" : "down");
        !           983: 
        !           984:   if (new)
        !           985:     {
        !           986:       key = new;
        !           987:       buck = bgp_get_bucket(p, n, attrs, new->attrs->source != RTS_BGP);
        !           988:       if (!buck)                       /* Inconsistent attribute list */
        !           989:        return;
        !           990:     }
        !           991:   else
        !           992:     {
        !           993:       key = old;
        !           994:       if (!(buck = p->withdraw_bucket))
        !           995:        {
        !           996:          buck = p->withdraw_bucket = mb_alloc(P->pool, sizeof(struct bgp_bucket));
        !           997:          init_list(&buck->prefixes);
        !           998:        }
        !           999:     }
        !          1000:   path_id = p->add_path_tx ? key->attrs->src->global_id : 0;
        !          1001:   px = bgp_get_prefix(p, n->n.prefix, n->n.pxlen, path_id);
        !          1002:   if (px->bucket_node.next)
        !          1003:     {
        !          1004:       DBG("\tRemoving old entry.\n");
        !          1005:       rem_node(&px->bucket_node);
        !          1006:     }
        !          1007:   add_tail(&buck->prefixes, &px->bucket_node);
        !          1008:   bgp_schedule_packet(p->conn, PKT_UPDATE);
        !          1009: }
        !          1010: 
        !          1011: static int
        !          1012: bgp_create_attrs(struct bgp_proto *p, rte *e, ea_list **attrs, struct linpool *pool)
        !          1013: {
        !          1014:   ea_list *ea = lp_alloc(pool, sizeof(ea_list) + 4*sizeof(eattr));
        !          1015:   rta *rta = e->attrs;
        !          1016:   byte *z;
        !          1017: 
        !          1018:   ea->next = *attrs;
        !          1019:   *attrs = ea;
        !          1020:   ea->flags = EALF_SORTED;
        !          1021:   ea->count = 4;
        !          1022: 
        !          1023:   bgp_set_attr(ea->attrs, BA_ORIGIN,
        !          1024:        ((rta->source == RTS_OSPF_EXT1) || (rta->source == RTS_OSPF_EXT2)) ? ORIGIN_INCOMPLETE : ORIGIN_IGP);
        !          1025: 
        !          1026:   if (p->is_internal)
        !          1027:     bgp_set_attr_wa(ea->attrs+1, pool, BA_AS_PATH, 0);
        !          1028:   else
        !          1029:     {
        !          1030:       z = bgp_set_attr_wa(ea->attrs+1, pool, BA_AS_PATH, 6);
        !          1031:       z[0] = AS_PATH_SEQUENCE;
        !          1032:       z[1] = 1;                                /* 1 AS */
        !          1033:       put_u32(z+2, p->local_as);
        !          1034:     }
        !          1035: 
        !          1036:   /* iBGP -> use gw, eBGP multi-hop -> use source_addr,
        !          1037:      eBGP single-hop -> use gw if on the same iface */
        !          1038:   z = bgp_set_attr_wa(ea->attrs+2, pool, BA_NEXT_HOP, NEXT_HOP_LENGTH);
        !          1039:   if (p->cf->next_hop_self ||
        !          1040:       rta->dest != RTD_ROUTER ||
        !          1041:       ipa_equal(rta->gw, IPA_NONE) ||
        !          1042:       ipa_is_link_local(rta->gw) ||
        !          1043:       (!p->is_internal && !p->cf->next_hop_keep &&
        !          1044:        (!p->neigh || (rta->iface != p->neigh->iface))))
        !          1045:     set_next_hop(z, p->source_addr);
        !          1046:   else
        !          1047:     set_next_hop(z, rta->gw);
        !          1048: 
        !          1049:   bgp_set_attr(ea->attrs+3, BA_LOCAL_PREF, p->cf->default_local_pref);
        !          1050: 
        !          1051:   return 0;                            /* Leave decision to the filters */
        !          1052: }
        !          1053: 
        !          1054: 
        !          1055: static inline int
        !          1056: bgp_as_path_loopy(struct bgp_proto *p, rta *a)
        !          1057: {
        !          1058:   int num = p->cf->allow_local_as + 1;
        !          1059:   eattr *e = ea_find(a->eattrs, EA_CODE(EAP_BGP, BA_AS_PATH));
        !          1060:   return (e && (num > 0) && as_path_contains(e->u.ptr, p->local_as, num));
        !          1061: }
        !          1062: 
        !          1063: static inline int
        !          1064: bgp_originator_id_loopy(struct bgp_proto *p, rta *a)
        !          1065: {
        !          1066:   eattr *e = ea_find(a->eattrs, EA_CODE(EAP_BGP, BA_ORIGINATOR_ID));
        !          1067:   return (e && (e->u.data == p->local_id));
        !          1068: }
        !          1069: 
        !          1070: static inline int
        !          1071: bgp_cluster_list_loopy(struct bgp_proto *p, rta *a)
        !          1072: {
        !          1073:   eattr *e = ea_find(a->eattrs, EA_CODE(EAP_BGP, BA_CLUSTER_LIST));
        !          1074:   return (e && p->rr_client && int_set_contains(e->u.ptr, p->rr_cluster_id));
        !          1075: }
        !          1076: 
        !          1077: 
        !          1078: static inline void
        !          1079: bgp_path_prepend(rte *e, ea_list **attrs, struct linpool *pool, u32 as)
        !          1080: {
        !          1081:   eattr *a = ea_find(e->attrs->eattrs, EA_CODE(EAP_BGP, BA_AS_PATH));
        !          1082:   bgp_attach_attr(attrs, pool, BA_AS_PATH, (uintptr_t) as_path_prepend(pool, a->u.ptr, as));
        !          1083: }
        !          1084: 
        !          1085: static inline void
        !          1086: bgp_cluster_list_prepend(rte *e, ea_list **attrs, struct linpool *pool, u32 cid)
        !          1087: {
        !          1088:   eattr *a = ea_find(e->attrs->eattrs, EA_CODE(EAP_BGP, BA_CLUSTER_LIST));
        !          1089:   bgp_attach_attr(attrs, pool, BA_CLUSTER_LIST, (uintptr_t) int_set_prepend(pool, a ? a->u.ptr : NULL, cid));
        !          1090: }
        !          1091: 
        !          1092: static int
        !          1093: bgp_update_attrs(struct bgp_proto *p, rte *e, ea_list **attrs, struct linpool *pool, int rr)
        !          1094: {
        !          1095:   eattr *a;
        !          1096: 
        !          1097:   if (!p->is_internal && !p->rs_client)
        !          1098:     {
        !          1099:       bgp_path_prepend(e, attrs, pool, p->local_as);
        !          1100: 
        !          1101:       /* The MULTI_EXIT_DISC attribute received from a neighboring AS MUST NOT be
        !          1102:        * propagated to other neighboring ASes.
        !          1103:        * Perhaps it would be better to undefine it.
        !          1104:        */
        !          1105:       a = ea_find(e->attrs->eattrs, EA_CODE(EAP_BGP, BA_MULTI_EXIT_DISC));
        !          1106:       if (a)
        !          1107:        bgp_attach_attr(attrs, pool, BA_MULTI_EXIT_DISC, 0);
        !          1108:     }
        !          1109: 
        !          1110:   /* iBGP -> keep next_hop, eBGP multi-hop -> use source_addr,
        !          1111:    * eBGP single-hop -> keep next_hop if on the same iface.
        !          1112:    * If the next_hop is zero (i.e. link-local), keep only if on the same iface.
        !          1113:    *
        !          1114:    * Note that same-iface-check uses iface from route, which is based on gw.
        !          1115:    */
        !          1116:   a = ea_find(e->attrs->eattrs, EA_CODE(EAP_BGP, BA_NEXT_HOP));
        !          1117:   if (a && !p->cf->next_hop_self && 
        !          1118:       (p->cf->next_hop_keep ||
        !          1119:        (p->is_internal && ipa_nonzero(*((ip_addr *) a->u.ptr->data))) ||
        !          1120:        (p->neigh && (e->attrs->iface == p->neigh->iface))))
        !          1121:     {
        !          1122:       /* Leave the original next hop attribute, will check later where does it point */
        !          1123:     }
        !          1124:   else
        !          1125:     {
        !          1126:       /* Need to create new one */
        !          1127:       byte *b = bgp_attach_attr_wa(attrs, pool, BA_NEXT_HOP, NEXT_HOP_LENGTH);
        !          1128:       set_next_hop(b, p->source_addr);
        !          1129:     }
        !          1130: 
        !          1131:   if (rr)
        !          1132:     {
        !          1133:       /* Handling route reflection, RFC 4456 */
        !          1134:       struct bgp_proto *src = (struct bgp_proto *) e->attrs->src->proto;
        !          1135: 
        !          1136:       a = ea_find(e->attrs->eattrs, EA_CODE(EAP_BGP, BA_ORIGINATOR_ID));
        !          1137:       if (!a)
        !          1138:        bgp_attach_attr(attrs, pool, BA_ORIGINATOR_ID, src->remote_id);
        !          1139: 
        !          1140:       /* We attach proper cluster ID according to whether the route is entering or leaving the cluster */
        !          1141:       bgp_cluster_list_prepend(e, attrs, pool, src->rr_client ? src->rr_cluster_id : p->rr_cluster_id);
        !          1142: 
        !          1143:       /* Two RR clients with different cluster ID, hmmm */
        !          1144:       if (src->rr_client && p->rr_client && (src->rr_cluster_id != p->rr_cluster_id))
        !          1145:        bgp_cluster_list_prepend(e, attrs, pool, p->rr_cluster_id);
        !          1146:     }
        !          1147: 
        !          1148:   return 0;                            /* Leave decision to the filters */
        !          1149: }
        !          1150: 
        !          1151: static int
        !          1152: bgp_community_filter(struct bgp_proto *p, rte *e)
        !          1153: {
        !          1154:   eattr *a;
        !          1155:   struct adata *d;
        !          1156: 
        !          1157:   /* Check if we aren't forbidden to export the route by communities */
        !          1158:   a = ea_find(e->attrs->eattrs, EA_CODE(EAP_BGP, BA_COMMUNITY));
        !          1159:   if (a)
        !          1160:     {
        !          1161:       d = a->u.ptr;
        !          1162:       if (int_set_contains(d, BGP_COMM_NO_ADVERTISE))
        !          1163:        {
        !          1164:          DBG("\tNO_ADVERTISE\n");
        !          1165:          return 1;
        !          1166:        }
        !          1167:       if (!p->is_internal &&
        !          1168:          (int_set_contains(d, BGP_COMM_NO_EXPORT) ||
        !          1169:           int_set_contains(d, BGP_COMM_NO_EXPORT_SUBCONFED)))
        !          1170:        {
        !          1171:          DBG("\tNO_EXPORT\n");
        !          1172:          return 1;
        !          1173:        }
        !          1174:     }
        !          1175: 
        !          1176:   return 0;
        !          1177: }
        !          1178: 
        !          1179: int
        !          1180: bgp_import_control(struct proto *P, rte **new, ea_list **attrs, struct linpool *pool)
        !          1181: {
        !          1182:   rte *e = *new;
        !          1183:   struct bgp_proto *p = (struct bgp_proto *) P;
        !          1184:   struct bgp_proto *new_bgp = (e->attrs->src->proto->proto == &proto_bgp) ?
        !          1185:     (struct bgp_proto *) e->attrs->src->proto : NULL;
        !          1186: 
        !          1187:   if (p == new_bgp)                    /* Poison reverse updates */
        !          1188:     return -1;
        !          1189:   if (new_bgp)
        !          1190:     {
        !          1191:       /* We should check here for cluster list loop, because the receiving BGP instance
        !          1192:         might have different cluster ID  */
        !          1193:       if (bgp_cluster_list_loopy(p, e->attrs))
        !          1194:        return -1;
        !          1195: 
        !          1196:       if (p->cf->interpret_communities && bgp_community_filter(p, e))
        !          1197:        return -1;
        !          1198: 
        !          1199:       if (p->local_as == new_bgp->local_as && p->is_internal && new_bgp->is_internal)
        !          1200:        {
        !          1201:          /* Redistribution of internal routes with IBGP */
        !          1202:          if (p->rr_client || new_bgp->rr_client)
        !          1203:            /* Route reflection, RFC 4456 */
        !          1204:            return bgp_update_attrs(p, e, attrs, pool, 1);
        !          1205:          else
        !          1206:            return -1;
        !          1207:        }
        !          1208:       else
        !          1209:        return bgp_update_attrs(p, e, attrs, pool, 0);
        !          1210:     }
        !          1211:   else
        !          1212:     return bgp_create_attrs(p, e, attrs, pool);
        !          1213: }
        !          1214: 
        !          1215: static inline u32
        !          1216: bgp_get_neighbor(rte *r)
        !          1217: {
                           /*
                            * Return the AS number used to identify the neighbor of route @r.
                            * If the route has an AS_PATH attribute and as_path_get_first()
                            * reports success for it, the value it stored is returned.
                            * Otherwise the remote_as of the route's source protocol is used;
                            * that protocol is cast to struct bgp_proto without a check here.
                            */
        !          1218:   eattr *e = ea_find(r->attrs->eattrs, EA_CODE(EAP_BGP, BA_AS_PATH));
        !          1219:   u32 as;
        !          1220: 
        !          1221:   if (e && as_path_get_first(e->u.ptr, &as))
        !          1222:     return as;
        !          1223:   else
        !          1224:     return ((struct bgp_proto *) r->attrs->src->proto)->remote_as;
        !          1225: }
        !          1226: 
        !          1227: static inline int
        !          1228: rte_resolvable(rte *rt)
        !          1229: {
                           /*
                            * Return nonzero iff the destination type of route @rt is one of
                            * RTD_ROUTER, RTD_DEVICE or RTD_MULTIPATH. The callers in this file
                            * use the result for the RFC 4271 9.1.2.1 resolvability test.
                            */
        !          1230:   int rd = rt->attrs->dest;  
        !          1231:   return (rd == RTD_ROUTER) || (rd == RTD_DEVICE) || (rd == RTD_MULTIPATH);
        !          1232: }
        !          1233: 
        !          1234: int
        !          1235: bgp_rte_better(rte *new, rte *old)
        !          1236: {
                           /*
                            * Decide whether route @new is preferred over route @old.
                            *
                            * The criteria below are applied in order; the first one on which
                            * the two routes differ decides. Returns 1 when @new wins and 0
                            * otherwise (including the case where no criterion prefers @new).
                            *
                            * The source protocols of both routes are cast to struct bgp_proto
                            * without a check. n and o are scratch values holding the @new and
                            * @old side of whichever criterion is currently being compared.
                            */
        !          1237:   struct bgp_proto *new_bgp = (struct bgp_proto *) new->attrs->src->proto;
        !          1238:   struct bgp_proto *old_bgp = (struct bgp_proto *) old->attrs->src->proto;
        !          1239:   eattr *x, *y;
        !          1240:   u32 n, o;
        !          1241: 
        !          1242:   /* Skip suppressed routes (see bgp_rte_recalculate()) */
                           /* A route with the lower suppressed value is preferred */
        !          1243:   n = new->u.bgp.suppressed;
        !          1244:   o = old->u.bgp.suppressed;
        !          1245:   if (n > o)
        !          1246:     return 0;
        !          1247:   if (n < o)
        !          1248:     return 1;
        !          1249: 
        !          1250:   /* RFC 4271 9.1.2.1. Route resolvability test */
                           /* A resolvable route beats an unresolvable one */
        !          1251:   n = rte_resolvable(new);
        !          1252:   o = rte_resolvable(old);
        !          1253:   if (n > o)
        !          1254:     return 1;
        !          1255:   if (n < o)
        !          1256:     return 0;
        !          1257: 
        !          1258:   /* Start with local preferences */
                           /* Higher wins; a missing attribute falls back to the protocol's default_local_pref */
        !          1259:   x = ea_find(new->attrs->eattrs, EA_CODE(EAP_BGP, BA_LOCAL_PREF));
        !          1260:   y = ea_find(old->attrs->eattrs, EA_CODE(EAP_BGP, BA_LOCAL_PREF));
        !          1261:   n = x ? x->u.data : new_bgp->cf->default_local_pref;
        !          1262:   o = y ? y->u.data : old_bgp->cf->default_local_pref;
        !          1263:   if (n > o)
        !          1264:     return 1;
        !          1265:   if (n < o)
        !          1266:     return 0;
        !          1267: 
        !          1268:   /* RFC 4271 9.1.2.2. a)  Use AS path lengths */
                           /* Done if either protocol enables compare_path_lengths; shorter wins,
                              a missing AS_PATH counts as AS_PATH_MAXLEN */
        !          1269:   if (new_bgp->cf->compare_path_lengths || old_bgp->cf->compare_path_lengths)
        !          1270:     {
        !          1271:       x = ea_find(new->attrs->eattrs, EA_CODE(EAP_BGP, BA_AS_PATH));
        !          1272:       y = ea_find(old->attrs->eattrs, EA_CODE(EAP_BGP, BA_AS_PATH));
        !          1273:       n = x ? as_path_getlen(x->u.ptr) : AS_PATH_MAXLEN;
        !          1274:       o = y ? as_path_getlen(y->u.ptr) : AS_PATH_MAXLEN;
        !          1275:       if (n < o)
        !          1276:        return 1;
        !          1277:       if (n > o)
        !          1278:        return 0;
        !          1279:     }
        !          1280: 
        !          1281:   /* RFC 4271 9.1.2.2. b) Use origins */
                           /* Lower origin value wins; a missing ORIGIN counts as ORIGIN_INCOMPLETE */
        !          1282:   x = ea_find(new->attrs->eattrs, EA_CODE(EAP_BGP, BA_ORIGIN));
        !          1283:   y = ea_find(old->attrs->eattrs, EA_CODE(EAP_BGP, BA_ORIGIN));
        !          1284:   n = x ? x->u.data : ORIGIN_INCOMPLETE;
        !          1285:   o = y ? y->u.data : ORIGIN_INCOMPLETE;
        !          1286:   if (n < o)
        !          1287:     return 1;
        !          1288:   if (n > o)
        !          1289:     return 0;
        !          1290: 
        !          1291:   /* RFC 4271 9.1.2.2. c) Compare MED's */
        !          1292:   /* Proper RFC 4271 path selection cannot be interpreted as finding
        !          1293:    * the best path in some ordering. It is implemented partially in
        !          1294:    * bgp_rte_recalculate() when deterministic_med option is
        !          1295:    * active. Without that option, the behavior is just an
        !          1296:    * approximation, which in specific situations may lead to
        !          1297:    * persistent routing loops, because it is nondeterministic - it
        !          1298:    * depends on the order in which routes appeared. But it is also the
        !          1299:    * same behavior as used by default in Cisco routers, so it is
        !          1300:    * probably not a big issue.
        !          1301:    */
                           /* MEDs are compared when either protocol sets med_metric or both routes
                              have the same neighbor AS; lower wins, missing MED uses default_med */
        !          1302:   if (new_bgp->cf->med_metric || old_bgp->cf->med_metric ||
        !          1303:       (bgp_get_neighbor(new) == bgp_get_neighbor(old)))
        !          1304:     {
        !          1305:       x = ea_find(new->attrs->eattrs, EA_CODE(EAP_BGP, BA_MULTI_EXIT_DISC));
        !          1306:       y = ea_find(old->attrs->eattrs, EA_CODE(EAP_BGP, BA_MULTI_EXIT_DISC));
        !          1307:       n = x ? x->u.data : new_bgp->cf->default_med;
        !          1308:       o = y ? y->u.data : old_bgp->cf->default_med;
        !          1309:       if (n < o)
        !          1310:        return 1;
        !          1311:       if (n > o)
        !          1312:        return 0;
        !          1313:     }
        !          1314: 
        !          1315:   /* RFC 4271 9.1.2.2. d) Prefer external peers */
        !          1316:   if (new_bgp->is_internal > old_bgp->is_internal)
        !          1317:     return 0;
        !          1318:   if (new_bgp->is_internal < old_bgp->is_internal)
        !          1319:     return 1;
        !          1320: 
        !          1321:   /* RFC 4271 9.1.2.2. e) Compare IGP metrics */
                           /* A protocol with igp_metric disabled contributes 0; lower wins */
        !          1322:   n = new_bgp->cf->igp_metric ? new->attrs->igp_metric : 0;
        !          1323:   o = old_bgp->cf->igp_metric ? old->attrs->igp_metric : 0;
        !          1324:   if (n < o)
        !          1325:     return 1;
        !          1326:   if (n > o)
        !          1327:     return 0;
        !          1328: 
        !          1329:   /* RFC 4271 9.1.2.2. f) Compare BGP identifiers */
        !          1330:   /* RFC 4456 9. a) Use ORIGINATOR_ID instead of local neighbor ID */
        !          1331:   x = ea_find(new->attrs->eattrs, EA_CODE(EAP_BGP, BA_ORIGINATOR_ID));
        !          1332:   y = ea_find(old->attrs->eattrs, EA_CODE(EAP_BGP, BA_ORIGINATOR_ID));
        !          1333:   n = x ? x->u.data : new_bgp->remote_id;
        !          1334:   o = y ? y->u.data : old_bgp->remote_id;
        !          1335: 
        !          1336:   /* RFC 5004 - prefer older routes */
        !          1337:   /* (if both are external and from different peer) */
                           /* Only new_bgp->is_internal is tested: step d) above has already
                              returned unless both is_internal values are equal */
        !          1338:   if ((new_bgp->cf->prefer_older || old_bgp->cf->prefer_older) &&
        !          1339:       !new_bgp->is_internal && n != o)
        !          1340:     return 0;
        !          1341: 
        !          1342:   /* rest of RFC 4271 9.1.2.2. f) */
        !          1343:   if (n < o)
        !          1344:     return 1;
        !          1345:   if (n > o)
        !          1346:     return 0;
        !          1347: 
        !          1348:   /* RFC 4456 9. b) Compare cluster list lengths */
                           /* Shorter wins; a missing CLUSTER_LIST counts as size 0 */
        !          1349:   x = ea_find(new->attrs->eattrs, EA_CODE(EAP_BGP, BA_CLUSTER_LIST));
        !          1350:   y = ea_find(old->attrs->eattrs, EA_CODE(EAP_BGP, BA_CLUSTER_LIST));
        !          1351:   n = x ? int_set_get_size(x->u.ptr) : 0;
        !          1352:   o = y ? int_set_get_size(y->u.ptr) : 0;
        !          1353:   if (n < o)
        !          1354:     return 1;
        !          1355:   if (n > o)
        !          1356:     return 0;
        !          1357: 
        !          1358:   /* RFC 4271 9.1.2.2. g) Compare peer IP addresses */
                           /* Final tie-break: @new wins only if its configured remote_ip compares lower */
        !          1359:   return (ipa_compare(new_bgp->cf->remote_ip, old_bgp->cf->remote_ip) < 0);
        !          1360: }
        !          1361: 
        !          1362: 
        !          1363: int
        !          1364: bgp_rte_mergable(rte *pri, rte *sec)
        !          1365: {
                           /*
                            * Decide whether route @sec may be merged with route @pri.
                            *
                            * Returns 1 only if both routes have the same suppressed flag, @sec
                            * is resolvable, and the routes tie on every criterion compared
                            * below (the same ones as steps up to 9.1.2.2 e) in
                            * bgp_rte_better()); returns 0 as soon as one of them differs.
                            *
                            * The source protocols of both routes are cast to struct bgp_proto
                            * without a check. p and s are scratch values for the @pri and
                            * @sec side of the current criterion.
                            */
        !          1366:   struct bgp_proto *pri_bgp = (struct bgp_proto *) pri->attrs->src->proto;
        !          1367:   struct bgp_proto *sec_bgp = (struct bgp_proto *) sec->attrs->src->proto;
        !          1368:   eattr *x, *y;
        !          1369:   u32 p, s;
        !          1370: 
        !          1371:   /* Skip suppressed routes (see bgp_rte_recalculate()) */
        !          1372:   if (pri->u.bgp.suppressed != sec->u.bgp.suppressed)
        !          1373:     return 0;
        !          1374: 
        !          1375:   /* RFC 4271 9.1.2.1. Route resolvability test */
                           /* Only @sec is tested; @pri is not checked in this function */
        !          1376:   if (!rte_resolvable(sec))
        !          1377:     return 0;
        !          1378: 
        !          1379:   /* Start with local preferences */
        !          1380:   x = ea_find(pri->attrs->eattrs, EA_CODE(EAP_BGP, BA_LOCAL_PREF));
        !          1381:   y = ea_find(sec->attrs->eattrs, EA_CODE(EAP_BGP, BA_LOCAL_PREF));
        !          1382:   p = x ? x->u.data : pri_bgp->cf->default_local_pref;
        !          1383:   s = y ? y->u.data : sec_bgp->cf->default_local_pref;
        !          1384:   if (p != s)
        !          1385:     return 0;
        !          1386: 
        !          1387:   /* RFC 4271 9.1.2.2. a)  Use AS path lengths */
        !          1388:   if (pri_bgp->cf->compare_path_lengths || sec_bgp->cf->compare_path_lengths)
        !          1389:     {
        !          1390:       x = ea_find(pri->attrs->eattrs, EA_CODE(EAP_BGP, BA_AS_PATH));
        !          1391:       y = ea_find(sec->attrs->eattrs, EA_CODE(EAP_BGP, BA_AS_PATH));
        !          1392:       p = x ? as_path_getlen(x->u.ptr) : AS_PATH_MAXLEN;
        !          1393:       s = y ? as_path_getlen(y->u.ptr) : AS_PATH_MAXLEN;
        !          1394: 
        !          1395:       if (p != s)
        !          1396:        return 0;
        !          1397: 
                               /* Disabled alternative: tolerate a bounded path-length difference */
        !          1398: //      if (DELTA(p, s) > pri_bgp->cf->relax_multipath)
        !          1399: //     return 0;
        !          1400:     }
        !          1401: 
        !          1402:   /* RFC 4271 9.1.2.2. b) Use origins */
        !          1403:   x = ea_find(pri->attrs->eattrs, EA_CODE(EAP_BGP, BA_ORIGIN));
        !          1404:   y = ea_find(sec->attrs->eattrs, EA_CODE(EAP_BGP, BA_ORIGIN));
        !          1405:   p = x ? x->u.data : ORIGIN_INCOMPLETE;
        !          1406:   s = y ? y->u.data : ORIGIN_INCOMPLETE;
        !          1407:   if (p != s)
        !          1408:     return 0;
        !          1409: 
        !          1410:   /* RFC 4271 9.1.2.2. c) Compare MED's */
                           /* Same applicability condition as in bgp_rte_better() */
        !          1411:   if (pri_bgp->cf->med_metric || sec_bgp->cf->med_metric ||
        !          1412:       (bgp_get_neighbor(pri) == bgp_get_neighbor(sec)))
        !          1413:     {
        !          1414:       x = ea_find(pri->attrs->eattrs, EA_CODE(EAP_BGP, BA_MULTI_EXIT_DISC));
        !          1415:       y = ea_find(sec->attrs->eattrs, EA_CODE(EAP_BGP, BA_MULTI_EXIT_DISC));
        !          1416:       p = x ? x->u.data : pri_bgp->cf->default_med;
        !          1417:       s = y ? y->u.data : sec_bgp->cf->default_med;
        !          1418:       if (p != s)
        !          1419:        return 0;
        !          1420:     }
        !          1421: 
        !          1422:   /* RFC 4271 9.1.2.2. d) Prefer external peers */
        !          1423:   if (pri_bgp->is_internal != sec_bgp->is_internal)
        !          1424:     return 0;
        !          1425: 
        !          1426:   /* RFC 4271 9.1.2.2. e) Compare IGP metrics */
        !          1427:   p = pri_bgp->cf->igp_metric ? pri->attrs->igp_metric : 0;
        !          1428:   s = sec_bgp->cf->igp_metric ? sec->attrs->igp_metric : 0;
        !          1429:   if (p != s)
        !          1430:     return 0;
        !          1431: 
        !          1432:   /* Remaining criteria are ignored */
        !          1433: 
        !          1434:   return 1;
        !          1435: }
        !          1436: 
        !          1437: 
        !          1438: 
        !          1439: static inline int
        !          1440: same_group(rte *r, u32 lpref, u32 lasn)
        !          1441: {
                           /* Nonzero iff route @r has preference @lpref and its neighbor AS
                              (as computed by bgp_get_neighbor()) equals @lasn */
        !          1442:   return (r->pref == lpref) && (bgp_get_neighbor(r) == lasn);
        !          1443: }
        !          1444: 
        !          1445: static inline int
        !          1446: use_deterministic_med(rte *r)
        !          1447: {
                           /* Nonzero iff the source protocol of route @r is a BGP instance whose
                              configuration has deterministic_med set. The protocol type is
                              checked before the cast to struct bgp_proto. */
        !          1448:   struct proto *P = r->attrs->src->proto;
        !          1449:   return (P->proto == &proto_bgp) && ((struct bgp_proto *) P)->cf->deterministic_med;
        !          1450: }
        !          1451: 
        !          1452: int
        !          1453: bgp_rte_recalculate(rtable *table, net *net, rte *new, rte *old, rte *old_best)
        !          1454: {
                           /*
                            * Lower-level (per-group) route selection for deterministic MED.
                            *
                            * @new is the route being added (may be NULL), @old the route being
                            * replaced or removed (may be NULL), @old_best the previous best
                            * route of @net (NULL-checked before it is dereferenced). @table is
                            * only passed through to the recursive calls.
                            *
                            * Updates the u.bgp.suppressed flag of routes in the affected group
                            * so that the chosen best-in-group route is the one left
                            * unsuppressed. Returns nonzero when the caller has to force a
                            * recalculation and zero otherwise; see the discussion before the
                            * final return.
                            */
        !          1455:   rte *r, *s;
        !          1456:   rte *key = new ? new : old;
        !          1457:   u32 lpref = key->pref;
        !          1458:   u32 lasn = bgp_get_neighbor(key);
        !          1459:   int old_is_group_best = 0;
        !          1460: 
        !          1461:   /*
        !          1462:    * Proper RFC 4271 path selection is a bit complicated, it cannot be
        !          1463:    * implemented just by rte_better(), because it is not a linear
        !          1464:    * ordering. But it can be split into two levels, where the lower
        !          1465:    * level chooses the best routes in each group of routes from the
        !          1466:    * same neighboring AS and higher level chooses the best route (with
        !          1467:    * a slightly different ordering) between the best-in-group routes.
        !          1468:    *
        !          1469:    * When deterministic_med is disabled, we just ignore this issue and
        !          1470:    * choose the best route by bgp_rte_better() alone. If enabled, the
        !          1471:    * lower level of the route selection is done here (for the group
        !          1472:    * to which the changed route belongs), all routes in group are
        !          1473:    * marked as suppressed, just chosen best-in-group is not.
        !          1474:    *
        !          1475:    * Global best route selection then implements higher level by
        !          1476:    * choosing between non-suppressed routes (as they are always
        !          1477:    * preferred over suppressed routes). Routes from BGP protocols
        !          1478:    * that do not set deterministic_med are just never suppressed. As
        !          1479:    * they do not participate in the lower level selection, it is OK
        !          1480:    * that this fn is not called for them.
        !          1481:    *
        !          1482:    * The idea is simple, the implementation is more problematic,
        !          1483:    * mostly because of optimizations in rte_recalculate() that
        !          1484:    * avoid full recalculation in most cases.
        !          1485:    *
        !          1486:    * We can assume that at least one of new, old is non-NULL and both
        !          1487:    * are from the same protocol with enabled deterministic_med. We
        !          1488:    * group routes by both neighbor AS (lasn) and preference (lpref),
        !          1489:    * because bgp_rte_better() does not handle preference itself.
        !          1490:    */
        !          1491: 
        !          1492:   /* If new and old are from different groups, we just process that
        !          1493:      as two independent events */
        !          1494:   if (new && old && !same_group(old, lpref, lasn))
        !          1495:     {
        !          1496:       int i1, i2;
                               /* Removal of old from its group, then insertion of new into its group */
        !          1497:       i1 = bgp_rte_recalculate(table, net, NULL, old, old_best);
        !          1498:       i2 = bgp_rte_recalculate(table, net, new, NULL, old_best);
        !          1499:       return i1 || i2;
        !          1500:     }
        !          1501: 
        !          1502:   /* 
        !          1503:    * We could find the best-in-group and then make some shortcuts like
        !          1504:    * in rte_recalculate, but as we would have to walk through all
        !          1505:    * net->routes just to find it, it is probably not worth it. So we
        !          1506:    * just have two simpler fast cases that use just the old route.
        !          1507:    * We also set suppressed flag to avoid using it in bgp_rte_better().
        !          1508:    */
        !          1509: 
        !          1510:   if (new)
        !          1511:     new->u.bgp.suppressed = 1;
        !          1512: 
        !          1513:   if (old)
        !          1514:     {
                               /* Remember whether old was the unsuppressed route before marking it */
        !          1515:       old_is_group_best = !old->u.bgp.suppressed;
        !          1516:       old->u.bgp.suppressed = 1;
        !          1517:       int new_is_better = new && bgp_rte_better(new, old);
        !          1518: 
        !          1519:       /* The first case - replace not best with worse (or remove not best) */
        !          1520:       if (!old_is_group_best && !new_is_better)
        !          1521:        return 0;
        !          1522: 
        !          1523:       /* The second case - replace the best with better */
        !          1524:       if (old_is_group_best && new_is_better)
        !          1525:        {
        !          1526:          /* new is best-in-group, see the discussion below - this is
        !          1527:             a special variant of NBG && OBG. From OBG we can deduce
        !          1528:             that same_group(old_best) iff (old == old_best)  */
        !          1529:          new->u.bgp.suppressed = 0;
        !          1530:          return (old == old_best);
        !          1531:        }
        !          1532:     }
        !          1533: 
        !          1534:   /* The default case - find a new best-in-group route */
        !          1535:   r = new; /* new may not be in the list */
                           /* Every group member in the list is marked suppressed; r tracks the best seen so far */
        !          1536:   for (s=net->routes; rte_is_valid(s); s=s->next)
        !          1537:     if (use_deterministic_med(s) && same_group(s, lpref, lasn))
        !          1538:       {
        !          1539:        s->u.bgp.suppressed = 1;
        !          1540:        if (!r || bgp_rte_better(s, r))
        !          1541:          r = s;
        !          1542:       }
        !          1543: 
        !          1544:   /* Simple case - the last route in group disappears */
        !          1545:   if (!r)
        !          1546:     return 0;
        !          1547: 
        !          1548:   /* Found best-in-group */
        !          1549:   r->u.bgp.suppressed = 0;
        !          1550: 
        !          1551:   /*
        !          1552:    * There are generally two reasons why we have to force
        !          1553:    * recalculation (return 1): First, the new route may be wrongfully
        !          1554:    * chosen to be the best in the first case check in
        !          1555:    * rte_recalculate(), this may happen only if old_best is from the
        !          1556:    * same group. Second, another (different than new route)
        !          1557:    * best-in-group is chosen and that may be the proper best (although
        !          1558:    * rte_recalculate() would otherwise ignore that possibility).
        !          1559:    *
        !          1560:    * There are three possible cases according to whether the old route
        !          1561:    * was the best in group (OBG, stored in old_is_group_best) and
        !          1562:    * whether the new route is the best in group (NBG, tested by r == new).
        !          1563:    * These cases work even if old or new is NULL.
        !          1564:    *
        !          1565:    * NBG -> new is a possible candidate for the best route, so we just
        !          1566:    *        check for the first reason using same_group().
        !          1567:    *
        !          1568:    * !NBG && OBG -> Second reason applies, return 1
        !          1569:    *
        !          1570:    * !NBG && !OBG -> Best in group does not change, old != old_best,
        !          1571:    *                 rte_better(new, old_best) is false and therefore
        !          1572:    *                 the first reason does not apply, return 0
        !          1573:    */
        !          1574: 
        !          1575:   if (r == new)
        !          1576:     return old_best && same_group(old_best, lpref, lasn);
        !          1577:   else
        !          1578:     return old_is_group_best;
        !          1579: }
        !          1580: 
        !          1581: static struct adata *
        !          1582: bgp_aggregator_convert_to_new(struct adata *old, struct linpool *pool)
        !          1583: {
                           /*
                            * Allocate from @pool a new adata with an 8-byte payload and let
                            * aggregator_convert_to_new() fill it from @old. Returns the new
                            * adata; @old itself is not modified by this function.
                            */
        !          1584:   struct adata *newa = lp_alloc(pool, sizeof(struct adata) + 8);
        !          1585:   newa->length = 8;
        !          1586:   aggregator_convert_to_new(old, newa->data);
        !          1587:   return newa;
        !          1588: }
        !          1589: 
        !          1590: 
        !          1591: /* Take last req_as ASNs from path old2 (in 2B format), convert to 4B format
        !          1592:  * and append path old4 (in 4B format).
        !          1593:  */
        !          1594: static struct adata *
        !          1595: bgp_merge_as_paths(struct adata *old2, struct adata *old4, int req_as, struct linpool *pool)
        !          1596: {
                           /*
                            * Build a new adata in @pool holding the output of
                            * as_path_convert_to_new(@old2, ..., @req_as) followed by the raw
                            * bytes of @old4. @old4 may be NULL, in which case only the
                            * converted part is stored. Returns the new adata.
                            *
                            * NOTE(review): buf is a stack VLA of old2->length * 2 bytes;
                            * presumably that bounds the converted size (2-byte ASNs growing
                            * to 4 bytes) and old2->length is nonzero and small - confirm
                            * against as_path_convert_to_new() and the callers.
                            */
        !          1597:   byte buf[old2->length * 2];
        !          1598: 
                           /* ol = byte length of the converted part, nl = total length of the result */
        !          1599:   int ol = as_path_convert_to_new(old2, buf, req_as);
        !          1600:   int nl = ol + (old4 ? old4->length : 0);
        !          1601: 
        !          1602:   struct adata *newa = lp_alloc(pool, sizeof(struct adata) + nl);
        !          1603:   newa->length = nl;
        !          1604:   memcpy(newa->data, buf, ol);
        !          1605:   if (old4) memcpy(newa->data + ol, old4->data, old4->length);
        !          1606: 
        !          1607:   return newa;
        !          1608: }
        !          1609: 
        !          1610: static int
        !          1611: as4_aggregator_valid(struct adata *aggr)
        !          1612: {
                           /* The only check made here: the attribute payload must be exactly 8 bytes long */
        !          1613:   return aggr->length == 8;
        !          1614: }
        !          1615: 
        !          1616: 
        !          1617: /* Reconstruct 4B AS_PATH and AGGREGATOR according to RFC 4893 4.2.3 */
        !          1618: static void
        !          1619: bgp_reconstruct_4b_atts(struct bgp_proto *p, rta *a, struct linpool *pool)
        !          1620: {
                           /*
                            * Replace, in place, the data of the AS_PATH and AGGREGATOR
                            * attributes of @a with 4-byte-AS versions, taking AS4_PATH and
                            * AS4_AGGREGATOR into account when they are present and accepted.
                            * New attribute data is allocated from @pool. @p is used for the
                            * log messages and is passed to validate_as4_path().
                            *
                            * p2/p4 are the AS_PATH / AS4_PATH attributes, a2/a4 the
                            * AGGREGATOR / AS4_AGGREGATOR attributes.
                            *
                            * NOTE(review): p2 is dereferenced without a NULL check -
                            * presumably the caller guarantees AS_PATH is present; confirm.
                            */
        !          1621:   eattr *p2 =ea_find(a->eattrs, EA_CODE(EAP_BGP, BA_AS_PATH));
        !          1622:   eattr *p4 =ea_find(a->eattrs, EA_CODE(EAP_BGP, BA_AS4_PATH));
        !          1623:   eattr *a2 =ea_find(a->eattrs, EA_CODE(EAP_BGP, BA_AGGREGATOR));
        !          1624:   eattr *a4 =ea_find(a->eattrs, EA_CODE(EAP_BGP, BA_AS4_AGGREGATOR));
        !          1625:   int a4_removed = 0;
        !          1626: 
                           /* An AS4_AGGREGATOR of the wrong size is treated as absent from here on;
                              a4_removed suppresses the "missing" warning further below */
        !          1627:   if (a4 && !as4_aggregator_valid(a4->u.ptr))
        !          1628:     {
        !          1629:       log(L_WARN "%s: AS4_AGGREGATOR attribute is invalid, skipping attribute", p->p.name);
        !          1630:       a4 = NULL;
        !          1631:       a4_removed = 1;
        !          1632:     }
        !          1633: 
        !          1634:   if (a2)
        !          1635:     {
                               /* Leading 16-bit value of the AGGREGATOR data, compared with AS_TRANS below */
        !          1636:       u32 a2_as = get_u16(a2->u.ptr->data);
        !          1637: 
        !          1638:       if (a4)
        !          1639:        {
        !          1640:          if (a2_as != AS_TRANS)
        !          1641:            {
        !          1642:              /* Routes were aggregated by old router and therefore AS4_PATH
        !          1643:               * and AS4_AGGREGATOR is invalid
        !          1644:               *
        !          1645:               * Convert AS_PATH and AGGREGATOR to 4B format and finish.
        !          1646:               */
        !          1647: 
        !          1648:              a2->u.ptr = bgp_aggregator_convert_to_new(a2->u.ptr, pool);
        !          1649:              p2->u.ptr = bgp_merge_as_paths(p2->u.ptr, NULL, AS_PATH_MAXLEN, pool);
        !          1650: 
        !          1651:              return;
        !          1652:            }
        !          1653:          else
        !          1654:            {
        !          1655:              /* Common case, use AS4_AGGREGATOR attribute */
        !          1656:              a2->u.ptr = a4->u.ptr;
        !          1657:            }
        !          1658:        }
        !          1659:       else
        !          1660:        {
        !          1661:          /* Common case, use old AGGREGATOR attribute */
        !          1662:          a2->u.ptr = bgp_aggregator_convert_to_new(a2->u.ptr, pool);
        !          1663: 
        !          1664:          if ((a2_as == AS_TRANS) && !a4_removed)
        !          1665:            log(L_WARN "%s: AGGREGATOR attribute contain AS_TRANS, but AS4_AGGREGATOR is missing", p->p.name);
        !          1666:        }
        !          1667:     }
        !          1668:   else
        !          1669:     if (a4)
        !          1670:       log(L_WARN "%s: AS4_AGGREGATOR attribute received, but AGGREGATOR attribute is missing", p->p.name);
        !          1671: 
                           /* p4_len is -1 when AS4_PATH is absent; a negative result from
                              validate_as4_path() is reported as a malformed attribute */
        !          1672:   int p2_len = as_path_getlen_int(p2->u.ptr, 2);
        !          1673:   int p4_len = p4 ? validate_as4_path(p, p4->u.ptr) : -1;
        !          1674: 
        !          1675:   if (p4 && (p4_len < 0))
        !          1676:     log(L_WARN "%s: AS4_PATH attribute is malformed, skipping attribute", p->p.name);
        !          1677: 
                           /* AS4_PATH is ignored when it is absent, malformed, of length zero or
                              longer than AS_PATH; otherwise p2_len - p4_len ASNs are requested
                              from AS_PATH and AS4_PATH is appended */
        !          1678:   if ((p4_len <= 0) || (p2_len < p4_len))
        !          1679:     p2->u.ptr = bgp_merge_as_paths(p2->u.ptr, NULL, AS_PATH_MAXLEN, pool);
        !          1680:   else
        !          1681:     p2->u.ptr = bgp_merge_as_paths(p2->u.ptr, p4->u.ptr, p2_len - p4_len, pool);
        !          1682: }
        !          1683: 
        !          1684: static void
        !          1685: bgp_remove_as4_attrs(struct bgp_proto *p, rta *a)
        !          1686: {
                           /*
                            * Unlink from the ea_list chain of @a every list element whose
                            * first attribute is AS4_PATH or AS4_AGGREGATOR. When @p has
                            * as4_session set, a warning is logged for each element removed.
                            */
        !          1687:   unsigned id1 = EA_CODE(EAP_BGP, BA_AS4_PATH);
        !          1688:   unsigned id2 = EA_CODE(EAP_BGP, BA_AS4_AGGREGATOR);
                           /* el points at the link being examined, so an element can be
                              removed by overwriting that link */
        !          1689:   ea_list **el = &(a->eattrs);
        !          1690: 
        !          1691:   /* We know that ea_lists constructed in bgp_decode_attrs() have one attribute per ea_list struct */
        !          1692:   while (*el != NULL)
        !          1693:     {
        !          1694:       unsigned fid = (*el)->attrs[0].id;
        !          1695: 
        !          1696:       if ((fid == id1) || (fid == id2))
        !          1697:        {
        !          1698:          *el = (*el)->next;
        !          1699:          if (p->as4_session)
        !          1700:            log(L_WARN "%s: Unexpected AS4_* attributes received", p->p.name);
        !          1701:        }
        !          1702:       else
        !          1703:        el = &((*el)->next);
        !          1704:     }
        !          1705: }
        !          1706: 
        !          1707: /**
        !          1708:  * bgp_decode_attrs - check and decode BGP attributes
        !          1709:  * @conn: connection
        !          1710:  * @attr: start of attribute block
        !          1711:  * @len: length of attribute block
        !          1712:  * @pool: linear pool to make all the allocations in
        !          1713:  * @mandatory: 1 iff presence of mandatory attributes has to be checked
        !          1714:  *
        !          1715:  * This function takes a BGP attribute block (a part of an Update message), checks
        !          1716:  * its consistency and converts it to a list of BIRD route attributes represented
        !          1717:  * by a &rta.
        !          1718:  */
        !          1719: struct rta *
        !          1720: bgp_decode_attrs(struct bgp_conn *conn, byte *attr, uint len, struct linpool *pool, int mandatory)
        !          1721: {
        !          1722:   struct bgp_proto *bgp = conn->bgp;
        !          1723:   rta *a = lp_alloc(pool, sizeof(struct rta));
        !          1724:   uint flags, code, l, i, type;
        !          1725:   int errcode;
        !          1726:   byte *z, *attr_start;
        !          1727:   byte seen[256/8];
        !          1728:   ea_list *ea;
        !          1729:   struct adata *ad;
        !          1730:   int withdraw = 0;
        !          1731: 
        !          1732:   bzero(a, sizeof(rta));
        !          1733:   a->source = RTS_BGP;
        !          1734:   a->scope = SCOPE_UNIVERSE;
        !          1735:   a->cast = RTC_UNICAST;
        !          1736:   /* a->dest = RTD_ROUTER;  -- set in bgp_set_next_hop() */
        !          1737:   a->from = bgp->cf->remote_ip;
        !          1738: 
        !          1739:   /* Parse the attributes */
        !          1740:   bzero(seen, sizeof(seen));
        !          1741:   DBG("BGP: Parsing attributes\n");
        !          1742:   while (len)
        !          1743:     {
        !          1744:       if (len < 2)
        !          1745:        goto malformed;
        !          1746:       attr_start = attr;
        !          1747:       flags = *attr++;
        !          1748:       code = *attr++;
        !          1749:       len -= 2;
        !          1750:       if (flags & BAF_EXT_LEN)
        !          1751:        {
        !          1752:          if (len < 2)
        !          1753:            goto malformed;
        !          1754:          l = get_u16(attr);
        !          1755:          attr += 2;
        !          1756:          len -= 2;
        !          1757:        }
        !          1758:       else
        !          1759:        {
        !          1760:          if (len < 1)
        !          1761:            goto malformed;
        !          1762:          l = *attr++;
        !          1763:          len--;
        !          1764:        }
        !          1765:       if (l > len)
        !          1766:        goto malformed;
        !          1767:       len -= l;
        !          1768:       z = attr;
        !          1769:       attr += l;
        !          1770:       DBG("Attr %02x %02x %d\n", code, flags, l);
        !          1771:       if (seen[code/8] & (1 << (code%8)))
        !          1772:        goto malformed;
        !          1773:       if (ATTR_KNOWN(code))
        !          1774:        {
        !          1775:          struct attr_desc *desc = &bgp_attr_table[code];
        !          1776:          if (desc->expected_length >= 0 && desc->expected_length != (int) l)
        !          1777:            { errcode = 5; goto err; }
        !          1778:          if ((desc->expected_flags ^ flags) & (BAF_OPTIONAL | BAF_TRANSITIVE))
        !          1779:            { errcode = 4; goto err; }
        !          1780:          if (!desc->allow_in_ebgp && !bgp->is_internal)
        !          1781:            continue;
        !          1782:          if (desc->validate)
        !          1783:            {
        !          1784:              errcode = desc->validate(bgp, z, l);
        !          1785:              if (errcode > 0)
        !          1786:                goto err;
        !          1787:              if (errcode == IGNORE)
        !          1788:                continue;
        !          1789:              if (errcode <= WITHDRAW)
        !          1790:                {
        !          1791:                  log(L_WARN "%s: Attribute %s is malformed, withdrawing update",
        !          1792:                      bgp->p.name, desc->name);
        !          1793:                  withdraw = 1;
        !          1794:                }
        !          1795:            }
        !          1796:          else if (code == BA_AS_PATH)
        !          1797:            {
        !          1798:              /* Special case as it might also trim the attribute */
        !          1799:              if (validate_as_path(bgp, z, &l) < 0)
        !          1800:                { errcode = 11; goto err; }
        !          1801:            }
        !          1802:          type = desc->type;
        !          1803:        }
        !          1804:       else                             /* Unknown attribute */
        !          1805:        {
        !          1806:          if (!(flags & BAF_OPTIONAL))
        !          1807:            { errcode = 2; goto err; }
        !          1808:          type = EAF_TYPE_OPAQUE;
        !          1809:        }
        !          1810:       
        !          1811:       // Only OPTIONAL and TRANSITIVE attributes may have non-zero PARTIAL flag
        !          1812:       // if (!((flags & BAF_OPTIONAL) && (flags & BAF_TRANSITIVE)) && (flags & BAF_PARTIAL))
        !          1813:       //   { errcode = 4; goto err; }
        !          1814: 
        !          1815:       seen[code/8] |= (1 << (code%8));
        !          1816:       ea = lp_alloc(pool, sizeof(ea_list) + sizeof(eattr));
        !          1817:       ea->next = a->eattrs;
        !          1818:       a->eattrs = ea;
        !          1819:       ea->flags = 0;
        !          1820:       ea->count = 1;
        !          1821:       ea->attrs[0].id = EA_CODE(EAP_BGP, code);
        !          1822:       ea->attrs[0].flags = flags;
        !          1823:       ea->attrs[0].type = type;
        !          1824:       if (type & EAF_EMBEDDED)
        !          1825:        ad = NULL;
        !          1826:       else
        !          1827:        {
        !          1828:          ad = lp_alloc(pool, sizeof(struct adata) + l);
        !          1829:          ea->attrs[0].u.ptr = ad;
        !          1830:          ad->length = l;
        !          1831:          memcpy(ad->data, z, l);
        !          1832:        }
        !          1833:       switch (type)
        !          1834:        {
        !          1835:        case EAF_TYPE_ROUTER_ID:
        !          1836:        case EAF_TYPE_INT:
        !          1837:          if (l == 1)
        !          1838:            ea->attrs[0].u.data = *z;
        !          1839:          else
        !          1840:            ea->attrs[0].u.data = get_u32(z);
        !          1841:          break;
        !          1842:        case EAF_TYPE_IP_ADDRESS:
        !          1843:          ipa_ntoh(*(ip_addr *)ad->data);
        !          1844:          break;
        !          1845:        case EAF_TYPE_INT_SET:
        !          1846:        case EAF_TYPE_LC_SET:
        !          1847:        case EAF_TYPE_EC_SET:
        !          1848:          {
        !          1849:            u32 *z = (u32 *) ad->data;
        !          1850:            for(i=0; i<ad->length/4; i++)
        !          1851:              z[i] = ntohl(z[i]);
        !          1852:            break;
        !          1853:          }
        !          1854:        }
        !          1855:     }
        !          1856: 
        !          1857:   if (withdraw)
        !          1858:     goto withdraw;
        !          1859: 
        !          1860: #ifdef IPV6
        !          1861:   /* If we received MP_REACH_NLRI we should check mandatory attributes */
        !          1862:   if (bgp->mp_reach_len != 0)
        !          1863:     mandatory = 1;
        !          1864: #endif
        !          1865: 
        !          1866:   /* If there is no (reachability) NLRI, we should exit now */
        !          1867:   if (! mandatory)
        !          1868:     return a;
        !          1869: 
        !          1870:   /* Check if all mandatory attributes are present */
        !          1871:   for(i=0; i < ARRAY_SIZE(bgp_mandatory_attrs); i++)
        !          1872:     {
        !          1873:       code = bgp_mandatory_attrs[i];
        !          1874:       if (!(seen[code/8] & (1 << (code%8))))
        !          1875:        {
        !          1876:          bgp_error(conn, 3, 3, &bgp_mandatory_attrs[i], 1);
        !          1877:          return NULL;
        !          1878:        }
        !          1879:     }
        !          1880: 
        !          1881:   /* When receiving attributes from non-AS4-aware BGP speaker,
        !          1882:    * we have to reconstruct 4B AS_PATH and AGGREGATOR attributes
        !          1883:    */
        !          1884:   if (! bgp->as4_session)
        !          1885:     bgp_reconstruct_4b_atts(bgp, a, pool);
        !          1886: 
        !          1887:   bgp_remove_as4_attrs(bgp, a);
        !          1888: 
        !          1889:   /* If the AS path attribute contains our AS, reject the routes */
        !          1890:   if (bgp_as_path_loopy(bgp, a))
        !          1891:     goto withdraw;
        !          1892: 
        !          1893:   /* Two checks for IBGP loops caused by route reflection, RFC 4456 */ 
        !          1894:   if (bgp_originator_id_loopy(bgp, a) ||
        !          1895:       bgp_cluster_list_loopy(bgp, a))
        !          1896:     goto withdraw;
        !          1897: 
        !          1898:   /* If there's no local preference, define one */
        !          1899:   if (!(seen[0] & (1 << BA_LOCAL_PREF)))
        !          1900:     bgp_attach_attr(&a->eattrs, pool, BA_LOCAL_PREF, bgp->cf->default_local_pref);
        !          1901: 
        !          1902:   return a;
        !          1903: 
        !          1904: withdraw:
        !          1905:   return NULL;
        !          1906: 
        !          1907: malformed:
        !          1908:   bgp_error(conn, 3, 1, NULL, 0);
        !          1909:   return NULL;
        !          1910: 
        !          1911: err:
        !          1912:   bgp_error(conn, 3, errcode, attr_start, z+l-attr_start);
        !          1913:   return NULL;
        !          1914: }
        !          1915: 
        !          1916: int
        !          1917: bgp_get_attr(eattr *a, byte *buf, int buflen)
        !          1918: {
        !          1919:   uint i = EA_ID(a->id);
        !          1920:   struct attr_desc *d;
        !          1921:   int len;
        !          1922: 
        !          1923:   if (ATTR_KNOWN(i))
        !          1924:     {
        !          1925:       d = &bgp_attr_table[i];
        !          1926:       len = bsprintf(buf, "%s", d->name);
        !          1927:       buf += len;
        !          1928:       if (d->format)
        !          1929:        {
        !          1930:          *buf++ = ':';
        !          1931:          *buf++ = ' ';
        !          1932:          d->format(a, buf, buflen - len - 2);
        !          1933:          return GA_FULL;
        !          1934:        }
        !          1935:       return GA_NAME;
        !          1936:     }
        !          1937:   bsprintf(buf, "%02x%s", i, (a->flags & BAF_TRANSITIVE) ? " [t]" : "");
        !          1938:   return GA_NAME;
        !          1939: }
        !          1940: 
        !          1941: void
        !          1942: bgp_init_bucket_table(struct bgp_proto *p)
        !          1943: {
        !          1944:   p->hash_size = 256;
        !          1945:   p->hash_limit = p->hash_size * 4;
        !          1946:   p->bucket_hash = mb_allocz(p->p.pool, p->hash_size * sizeof(struct bgp_bucket *));
        !          1947:   init_list(&p->bucket_queue);
        !          1948:   p->withdraw_bucket = NULL;
        !          1949:   // fib_init(&p->prefix_fib, p->p.pool, sizeof(struct bgp_prefix), 0, bgp_init_prefix);
        !          1950: }
        !          1951: 
        !          1952: void
        !          1953: bgp_free_bucket_table(struct bgp_proto *p)
        !          1954: {
        !          1955:   mb_free(p->bucket_hash);
        !          1956:   p->bucket_hash = NULL;
        !          1957: 
        !          1958:   struct bgp_bucket *b;
        !          1959:   WALK_LIST_FIRST(b, p->bucket_queue)
        !          1960:   {
        !          1961:     rem_node(&b->send_node);
        !          1962:     mb_free(b);
        !          1963:   }
        !          1964: 
        !          1965:   mb_free(p->withdraw_bucket);
        !          1966:   p->withdraw_bucket = NULL;
        !          1967: }
        !          1968: 
        !          1969: void
        !          1970: bgp_get_route_info(rte *e, byte *buf, ea_list *attrs)
        !          1971: {
        !          1972:   eattr *p = ea_find(attrs, EA_CODE(EAP_BGP, BA_AS_PATH));
        !          1973:   eattr *o = ea_find(attrs, EA_CODE(EAP_BGP, BA_ORIGIN));
        !          1974:   u32 origas;
        !          1975: 
        !          1976:   buf += bsprintf(buf, " (%d", e->pref);
        !          1977: 
        !          1978:   if (e->u.bgp.suppressed)
        !          1979:     buf += bsprintf(buf, "-");
        !          1980: 
        !          1981:   if (e->attrs->hostentry)
        !          1982:     {
        !          1983:       if (!rte_resolvable(e))
        !          1984:        buf += bsprintf(buf, "/-");
        !          1985:       else if (e->attrs->igp_metric >= IGP_METRIC_UNKNOWN)
        !          1986:        buf += bsprintf(buf, "/?");
        !          1987:       else
        !          1988:        buf += bsprintf(buf, "/%d", e->attrs->igp_metric);
        !          1989:     }
        !          1990:   buf += bsprintf(buf, ") [");
        !          1991: 
        !          1992:   if (p && as_path_get_last(p->u.ptr, &origas))
        !          1993:     buf += bsprintf(buf, "AS%u", origas);
        !          1994:   if (o)
        !          1995:     buf += bsprintf(buf, "%c", "ie?"[o->u.data]);
        !          1996:   strcpy(buf, "]");
        !          1997: }

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>