jehanne/sys/src/kern/ip/ethermedium.c

783 lines
16 KiB
C

/* Copyright (C) Charles Forsyth
* See /doc/license/NOTICE.Plan9-9k.txt for details about the licensing.
*/
/* Portions of this file are Copyright (C) 2015-2018 Giacomo Tesio <giacomo@tesio.it>
* See /doc/license/gpl-2.0.txt for details about the licensing.
*/
/* Portions of this file are Copyright (C) 9front's team.
* See /doc/license/9front-mit for details about the licensing.
* See http://code.9front.org/hg/plan9front/ for a list of authors.
*/
#include "u.h"
#include "../port/lib.h"
#include "mem.h"
#include "dat.h"
#include "fns.h"
#include "../port/error.h"
#include "../port/netif.h"
#include "ip.h"
#include "ipv6.h"
typedef struct Etherhdr Etherhdr;
struct Etherhdr
{
uint8_t d[6];
uint8_t s[6];
uint8_t t[2];
};
static uint8_t ipbroadcast[IPaddrlen] = {
0xff,0xff,0xff,0xff,
0xff,0xff,0xff,0xff,
0xff,0xff,0xff,0xff,
0xff,0xff,0xff,0xff,
};
static uint8_t etherbroadcast[] = { 0xff, 0xff, 0xff, 0xff, 0xff, 0xff };
static void etherread4(void *a);
static void etherread6(void *a);
static void etherbind(Ipifc *ifc, int argc, char **argv);
static void etherunbind(Ipifc *ifc);
static void etherbwrite(Ipifc *ifc, Block *bp, int version, uint8_t *ip);
static void etheraddmulti(Ipifc *ifc, uint8_t *a, uint8_t *ia);
static void etherremmulti(Ipifc *ifc, uint8_t *a, uint8_t *ia);
static Block* multicastarp(Fs *f, Arpent *a, Medium*, uint8_t *mac);
static void sendarp(Ipifc *ifc, Arpent *a);
static void sendgarp(Ipifc *ifc, uint8_t*);
static int multicastea(uint8_t *ea, uint8_t *ip);
static void recvarpproc(void*);
static void resolveaddr6(Ipifc *ifc, Arpent *a);
static void etherpref2addr(uint8_t *pref, uint8_t *ea);
Medium ethermedium =
{
.name= "ether",
.hsize= 14,
.mintu= 60,
.maxtu= 1514,
.maclen= 6,
.bind= etherbind,
.unbind= etherunbind,
.bwrite= etherbwrite,
.addmulti= etheraddmulti,
.remmulti= etherremmulti,
.ares= arpenter,
.areg= sendgarp,
.pref2addr= etherpref2addr,
};
Medium gbemedium =
{
.name= "gbe",
.hsize= 14,
.mintu= 60,
.maxtu= 9014,
.maclen= 6,
.bind= etherbind,
.unbind= etherunbind,
.bwrite= etherbwrite,
.addmulti= etheraddmulti,
.remmulti= etherremmulti,
.ares= arpenter,
.areg= sendgarp,
.pref2addr= etherpref2addr,
};
typedef struct Etherrock Etherrock;
struct Etherrock
{
Fs *f; /* file system we belong to */
Proc *arpp; /* arp process */
Proc *read4p; /* reading process (v4)*/
Proc *read6p; /* reading process (v6)*/
Chan *mchan4; /* Data channel for v4 */
Chan *achan; /* Arp channel */
Chan *cchan4; /* Control channel for v4 */
Chan *mchan6; /* Data channel for v6 */
Chan *cchan6; /* Control channel for v6 */
};
/*
* ethernet arp request
*/
enum
{
ETARP = 0x0806,
ETIP4 = 0x0800,
ETIP6 = 0x86DD,
ARPREQUEST = 1,
ARPREPLY = 2,
};
typedef struct Etherarp Etherarp;
struct Etherarp
{
uint8_t d[6];
uint8_t s[6];
uint8_t type[2];
uint8_t hrd[2];
uint8_t pro[2];
uint8_t hln;
uint8_t pln;
uint8_t op[2];
uint8_t sha[6];
uint8_t spa[4];
uint8_t tha[6];
uint8_t tpa[4];
};
static char *nbmsg = "nonblocking";
/*
* called to bind an IP ifc to an ethernet device
* called with ifc wlock'd
*/
static void
etherbind(Ipifc *ifc, int argc, char **argv)
{
Chan *mchan4, *cchan4, *achan, *mchan6, *cchan6, *schan;
char addr[Maxpath]; //char addr[2*KNAMELEN];
char dir[Maxpath]; //char dir[2*KNAMELEN];
char *buf;
int n;
char *ptr;
Etherrock *er;
if(argc < 2)
error(Ebadarg);
mchan4 = cchan4 = achan = mchan6 = cchan6 = nil;
buf = nil;
if(waserror()){
if(mchan4 != nil)
cclose(mchan4);
if(cchan4 != nil)
cclose(cchan4);
if(achan != nil)
cclose(achan);
if(mchan6 != nil)
cclose(mchan6);
if(cchan6 != nil)
cclose(cchan6);
if(buf != nil)
jehanne_free(buf);
nexterror();
}
/*
* open ipv4 conversation
*
* the dial will fail if the type is already open on
* this device.
*/
jehanne_snprint(addr, sizeof(addr), "%s!0x800", argv[2]); /* ETIP4 */
mchan4 = chandial(addr, nil, dir, &cchan4);
/*
* make it non-blocking
*/
cchan4->dev->write(cchan4, nbmsg, jehanne_strlen(nbmsg), 0);
/*
* get mac address and speed
*/
jehanne_snprint(addr, sizeof(addr), "%s/stats", argv[2]);
buf = smalloc(512);
schan = namec(addr, Aopen, OREAD, 0);
if(waserror()){
cclose(schan);
nexterror();
}
n = schan->dev->read(schan, buf, 511, 0);
cclose(schan);
poperror();
buf[n] = 0;
ptr = jehanne_strstr(buf, "addr: ");
if(!ptr)
error(Eio);
ptr += 6;
parsemac(ifc->mac, ptr, 6);
ptr = jehanne_strstr(buf, "mbps: ");
if(ptr){
ptr += 6;
ifc->mbps = jehanne_atoi(ptr);
} else
ifc->mbps = 100;
/*
* open arp conversation
*/
jehanne_snprint(addr, sizeof(addr), "%s!0x806", argv[2]); /* ETARP */
achan = chandial(addr, nil, nil, nil);
/*
* open ipv6 conversation
*
* the dial will fail if the type is already open on
* this device.
*/
jehanne_snprint(addr, sizeof(addr), "%s!0x86DD", argv[2]); /* ETIP6 */
mchan6 = chandial(addr, nil, dir, &cchan6);
/*
* make it non-blocking
*/
cchan6->dev->write(cchan6, nbmsg, jehanne_strlen(nbmsg), 0);
er = smalloc(sizeof(*er));
er->mchan4 = mchan4;
er->cchan4 = cchan4;
er->achan = achan;
er->mchan6 = mchan6;
er->cchan6 = cchan6;
er->f = ifc->conv->p->f;
ifc->arg = er;
jehanne_free(buf);
poperror();
kproc("etherread4", etherread4, ifc);
kproc("recvarpproc", recvarpproc, ifc);
kproc("etherread6", etherread6, ifc);
}
/*
* called with ifc wlock'd
*/
static void
etherunbind(Ipifc *ifc)
{
Etherrock *er = ifc->arg;
if(er->read4p)
postnote(er->read4p, 1, "unbind", 0);
if(er->read6p)
postnote(er->read6p, 1, "unbind", 0);
if(er->arpp)
postnote(er->arpp, 1, "unbind", 0);
/* wait for readers to die */
while(er->arpp != 0 || er->read4p != 0 || er->read6p != 0)
tsleep(&up->sleep, return0, 0, 300);
if(er->mchan4 != nil)
cclose(er->mchan4);
if(er->achan != nil)
cclose(er->achan);
if(er->cchan4 != nil)
cclose(er->cchan4);
if(er->mchan6 != nil)
cclose(er->mchan6);
if(er->cchan6 != nil)
cclose(er->cchan6);
jehanne_free(er);
}
/*
* called by ipoput with a single block to write with ifc rlock'd
*/
static void
etherbwrite(Ipifc *ifc, Block *bp, int version, uint8_t *ip)
{
Etherhdr *eh;
Arpent *a;
uint8_t mac[6];
Etherrock *er = ifc->arg;
/* get mac address of destination */
a = arpget(er->f->arp, bp, version, ifc, ip, mac);
if(a){
/* check for broadcast or multicast */
bp = multicastarp(er->f, a, ifc->medium, mac);
if(bp==nil){
switch(version){
case V4:
sendarp(ifc, a);
break;
case V6:
resolveaddr6(ifc, a);
break;
default:
panic("etherbwrite: version %d", version);
}
return;
}
}
/* make it a single block with space for the ether header */
bp = padblock(bp, ifc->medium->hsize);
if(bp->next)
bp = concatblock(bp);
if(BLEN(bp) < ifc->mintu)
bp = adjustblock(bp, ifc->mintu);
eh = (Etherhdr*)bp->rp;
/* copy in mac addresses and ether type */
jehanne_memmove(eh->s, ifc->mac, sizeof(eh->s));
jehanne_memmove(eh->d, mac, sizeof(eh->d));
switch(version){
case V4:
eh->t[0] = 0x08;
eh->t[1] = 0x00;
er->mchan4->dev->bwrite(er->mchan4, bp, 0);
break;
case V6:
eh->t[0] = 0x86;
eh->t[1] = 0xDD;
er->mchan6->dev->bwrite(er->mchan6, bp, 0);
break;
default:
panic("etherbwrite2: version %d", version);
}
ifc->out++;
}
/*
* process to read from the ethernet
*/
static void
etherread4(void *a)
{
Ipifc *ifc;
Block *bp;
Etherrock *er;
ifc = a;
er = ifc->arg;
er->read4p = up; /* hide identity under a rock for unbind */
if(waserror()){
er->read4p = 0;
pexit("hangup", 1);
}
for(;;){
bp = er->mchan4->dev->bread(er->mchan4, ifc->maxtu, 0);
if(!canrlock(ifc)){
freeb(bp);
continue;
}
if(waserror()){
runlock(ifc);
nexterror();
}
ifc->in++;
if(ifc->lifc == nil || BLEN(bp) <= ifc->medium->hsize)
freeb(bp);
else {
bp->rp += ifc->medium->hsize;
ipiput4(er->f, ifc, bp);
}
runlock(ifc);
poperror();
}
}
/*
* process to read from the ethernet, IPv6
*/
static void
etherread6(void *a)
{
Ipifc *ifc;
Block *bp;
Etherrock *er;
ifc = a;
er = ifc->arg;
er->read6p = up; /* hide identity under a rock for unbind */
if(waserror()){
er->read6p = 0;
pexit("hangup", 1);
}
for(;;){
bp = er->mchan6->dev->bread(er->mchan6, ifc->maxtu, 0);
if(!canrlock(ifc)){
freeb(bp);
continue;
}
if(waserror()){
runlock(ifc);
nexterror();
}
ifc->in++;
if(ifc->lifc == nil || BLEN(bp) <= ifc->medium->hsize)
freeb(bp);
else {
bp->rp += ifc->medium->hsize;
ipiput6(er->f, ifc, bp);
}
runlock(ifc);
poperror();
}
}
static void
etheraddmulti(Ipifc *ifc, uint8_t *a, uint8_t * _1)
{
uint8_t mac[6];
char buf[64];
Etherrock *er = ifc->arg;
int version;
version = multicastea(mac, a);
jehanne_sprint(buf, "addmulti %E", mac);
switch(version){
case V4:
er->cchan4->dev->write(er->cchan4, buf, jehanne_strlen(buf), 0);
break;
case V6:
er->cchan6->dev->write(er->cchan6, buf, jehanne_strlen(buf), 0);
break;
default:
panic("etheraddmulti: version %d", version);
}
}
static void
etherremmulti(Ipifc *ifc, uint8_t *a, uint8_t * _1)
{
uint8_t mac[6];
char buf[64];
Etherrock *er = ifc->arg;
int version;
version = multicastea(mac, a);
jehanne_sprint(buf, "remmulti %E", mac);
switch(version){
case V4:
er->cchan4->dev->write(er->cchan4, buf, jehanne_strlen(buf), 0);
break;
case V6:
er->cchan6->dev->write(er->cchan6, buf, jehanne_strlen(buf), 0);
break;
default:
panic("etherremmulti: version %d", version);
}
}
/*
* send an ethernet arp
* (only v4, v6 uses the neighbor discovery, rfc1970)
*/
static void
sendarp(Ipifc *ifc, Arpent *a)
{
int n;
Block *bp;
Etherarp *e;
Etherrock *er = ifc->arg;
/* don't do anything if it's been less than a second since the last */
if(NOW - a->ctime < 1000){
arprelease(er->f->arp, a);
return;
}
/* remove all but the last message */
while((bp = a->hold) != nil){
if(bp == a->last)
break;
a->hold = bp->list;
freeblist(bp);
}
/* try to keep it around for a second more */
a->ctime = NOW;
arprelease(er->f->arp, a);
n = sizeof(Etherarp);
if(n < a->type->mintu)
n = a->type->mintu;
bp = allocb(n);
jehanne_memset(bp->rp, 0, n);
e = (Etherarp*)bp->rp;
jehanne_memmove(e->tpa, a->ip+IPv4off, sizeof(e->tpa));
ipv4local(ifc, e->spa);
jehanne_memmove(e->sha, ifc->mac, sizeof(e->sha));
jehanne_memset(e->d, 0xff, sizeof(e->d)); /* ethernet broadcast */
jehanne_memmove(e->s, ifc->mac, sizeof(e->s));
hnputs(e->type, ETARP);
hnputs(e->hrd, 1);
hnputs(e->pro, ETIP4);
e->hln = sizeof(e->sha);
e->pln = sizeof(e->spa);
hnputs(e->op, ARPREQUEST);
bp->wp += n;
er->achan->dev->bwrite(er->achan, bp, 0);
}
static void
resolveaddr6(Ipifc *ifc, Arpent *a)
{
int sflag;
Block *bp;
Etherrock *er = ifc->arg;
uint8_t ipsrc[IPaddrlen];
/* don't do anything if it's been less than a second since the last */
if(NOW - a->ctime < ReTransTimer){
arprelease(er->f->arp, a);
return;
}
/* remove all but the last message */
while((bp = a->hold) != nil){
if(bp == a->last)
break;
a->hold = bp->list;
freeblist(bp);
}
/* try to keep it around for a second more */
a->ctime = NOW;
a->rtime = NOW + ReTransTimer;
if(a->rxtsrem <= 0) {
arprelease(er->f->arp, a);
return;
}
a->rxtsrem--;
arprelease(er->f->arp, a);
if(sflag = ipv6anylocal(ifc, ipsrc))
icmpns(er->f, ipsrc, sflag, a->ip, TARG_MULTI, ifc->mac);
}
/*
* send a gratuitous arp to refresh arp caches
*/
static void
sendgarp(Ipifc *ifc, uint8_t *ip)
{
int n;
Block *bp;
Etherarp *e;
Etherrock *er = ifc->arg;
/* don't arp for our initial non address */
if(ipcmp(ip, IPnoaddr) == 0)
return;
n = sizeof(Etherarp);
if(n < ifc->medium->mintu)
n = ifc->medium->mintu;
bp = allocb(n);
jehanne_memset(bp->rp, 0, n);
e = (Etherarp*)bp->rp;
jehanne_memmove(e->tpa, ip+IPv4off, sizeof(e->tpa));
jehanne_memmove(e->spa, ip+IPv4off, sizeof(e->spa));
jehanne_memmove(e->sha, ifc->mac, sizeof(e->sha));
jehanne_memset(e->d, 0xff, sizeof(e->d)); /* ethernet broadcast */
jehanne_memmove(e->s, ifc->mac, sizeof(e->s));
hnputs(e->type, ETARP);
hnputs(e->hrd, 1);
hnputs(e->pro, ETIP4);
e->hln = sizeof(e->sha);
e->pln = sizeof(e->spa);
hnputs(e->op, ARPREQUEST);
bp->wp += n;
er->achan->dev->bwrite(er->achan, bp, 0);
}
static void
recvarp(Ipifc *ifc)
{
int n;
Block *ebp, *rbp;
Etherarp *e, *r;
uint8_t ip[IPaddrlen];
static uint8_t eprinted[4], nullspa[4];
Etherrock *er = ifc->arg;
ebp = er->achan->dev->bread(er->achan, ifc->maxtu, 0);
if(ebp == nil)
return;
e = (Etherarp*)ebp->rp;
switch(nhgets(e->op)) {
default:
break;
case ARPREPLY:
/* check for machine using my ip address */
v4tov6(ip, e->spa);
if(iplocalonifc(ifc, ip) || ipproxyifc(er->f, ifc, ip)){
if(jehanne_memcmp(e->sha, ifc->mac, sizeof(e->sha)) != 0){
jehanne_print("arprep: 0x%E/0x%E also has ip addr %V\n",
e->s, e->sha, e->spa);
break;
}
}
/* make sure we're not entering broadcast addresses */
if(ipcmp(ip, ipbroadcast) == 0 ||
!jehanne_memcmp(e->sha, etherbroadcast, sizeof(e->sha))){
jehanne_print("arprep: 0x%E/0x%E cannot register broadcast address %I\n",
e->s, e->sha, e->spa);
break;
}
arpenter(er->f, V4, e->spa, e->sha, sizeof(e->sha), 0);
break;
case ARPREQUEST:
/* don't answer arps till we know who we are */
if(ifc->lifc == 0)
break;
/* check for machine using my ip or ether address */
v4tov6(ip, e->spa);
if(iplocalonifc(ifc, ip) || ipproxyifc(er->f, ifc, ip)){
if(jehanne_memcmp(e->sha, ifc->mac, sizeof(e->sha)) != 0){
if (jehanne_memcmp(eprinted, e->spa, sizeof(e->spa))){
/* print only once */
jehanne_print("arpreq: 0x%E also has ip addr %V\n", e->sha, e->spa);
jehanne_memmove(eprinted, e->spa, sizeof(e->spa));
}
}
} else {
if(jehanne_memcmp(e->sha, ifc->mac, sizeof(e->sha)) == 0){
/* Ignore ARP probes from ourself. */
if(jehanne_memcmp(e->spa, nullspa, sizeof(e->spa)) != 0)
jehanne_print("arpreq: %V also has ether addr %E\n", e->spa, e->sha);
break;
}
}
/* refresh what we know about sender */
arpenter(er->f, V4, e->spa, e->sha, sizeof(e->sha), 1);
/* answer only requests for our address or systems we're proxying for */
v4tov6(ip, e->tpa);
if(!iplocalonifc(ifc, ip))
if(!ipproxyifc(er->f, ifc, ip))
break;
n = sizeof(Etherarp);
if(n < ifc->mintu)
n = ifc->mintu;
rbp = allocb(n);
r = (Etherarp*)rbp->rp;
jehanne_memset(r, 0, sizeof(Etherarp));
hnputs(r->type, ETARP);
hnputs(r->hrd, 1);
hnputs(r->pro, ETIP4);
r->hln = sizeof(r->sha);
r->pln = sizeof(r->spa);
hnputs(r->op, ARPREPLY);
jehanne_memmove(r->tha, e->sha, sizeof(r->tha));
jehanne_memmove(r->tpa, e->spa, sizeof(r->tpa));
jehanne_memmove(r->sha, ifc->mac, sizeof(r->sha));
jehanne_memmove(r->spa, e->tpa, sizeof(r->spa));
jehanne_memmove(r->d, e->sha, sizeof(r->d));
jehanne_memmove(r->s, ifc->mac, sizeof(r->s));
rbp->wp += n;
er->achan->dev->bwrite(er->achan, rbp, 0);
}
freeb(ebp);
}
static void
recvarpproc(void *v)
{
Ipifc *ifc = v;
Etherrock *er = ifc->arg;
er->arpp = up;
if(waserror()){
er->arpp = 0;
pexit("hangup", 1);
}
for(;;)
recvarp(ifc);
}
static int
multicastea(uint8_t *ea, uint8_t *ip)
{
int x;
switch(x = ipismulticast(ip)){
case V4:
ea[0] = 0x01;
ea[1] = 0x00;
ea[2] = 0x5e;
ea[3] = ip[13] & 0x7f;
ea[4] = ip[14];
ea[5] = ip[15];
break;
case V6:
ea[0] = 0x33;
ea[1] = 0x33;
ea[2] = ip[12];
ea[3] = ip[13];
ea[4] = ip[14];
ea[5] = ip[15];
break;
}
return x;
}
/*
* fill in an arp entry for broadcast or multicast
* addresses. Return the first queued packet for the
* IP address.
*/
static Block*
multicastarp(Fs *f, Arpent *a, Medium *medium, uint8_t *mac)
{
/* is it broadcast? */
switch(ipforme(f, a->ip)){
case Runi:
return nil;
case Rbcast:
jehanne_memset(mac, 0xff, 6);
return arpresolve(f->arp, a, medium, mac);
default:
break;
}
/* if multicast, fill in mac */
switch(multicastea(mac, a->ip)){
case V4:
case V6:
return arpresolve(f->arp, a, medium, mac);
}
/* let arp take care of it */
return nil;
}
void
ethermediumlink(void)
{
addipmedium(&ethermedium);
addipmedium(&gbemedium);
}
static void
etherpref2addr(uint8_t *pref, uint8_t *ea)
{
pref[8] = ea[0] | 0x2;
pref[9] = ea[1];
pref[10] = ea[2];
pref[11] = 0xFF;
pref[12] = 0xFE;
pref[13] = ea[3];
pref[14] = ea[4];
pref[15] = ea[5];
}