mountd: prepend '$' to make use_ipaddr clients self-describing
[nfs-utils.git] / utils / mountd / cache.c
1
2 /*
3  * Handle communication with knfsd internal cache
4  *
5  * We open /proc/net/rpc/{auth.unix.ip,nfsd.export,nfsd.fh}/channel
6  * and listen for requests (using my_svc_run)
7  * 
8  */
9
10 #ifdef HAVE_CONFIG_H
11 #include <config.h>
12 #endif
13
14 #include <sys/types.h>
15 #include <sys/select.h>
16 #include <sys/stat.h>
17 #include <sys/vfs.h>
18 #include <time.h>
19 #include <netinet/in.h>
20 #include <arpa/inet.h>
21 #include <unistd.h>
22 #include <fcntl.h>
23 #include <errno.h>
24 #include <ctype.h>
25 #include <pwd.h>
26 #include <grp.h>
27 #include <mntent.h>
28 #include "misc.h"
29 #include "nfslib.h"
30 #include "exportfs.h"
31 #include "mountd.h"
32 #include "xmalloc.h"
33 #include "fsloc.h"
34 #include "pseudoflavors.h"
35
36 #ifdef USE_BLKID
37 #include "blkid/blkid.h"
38 #endif
39
/*
 * Entry points invoked by the RPC service loop.
 *
 * NOTE(review): the definitions are not in this part of the file.
 * Presumably cache_set_fds() adds the cache channel descriptors to
 * 'fdset' and cache_process_req() services the ones flagged in
 * 'readfds' - confirm against the definitions.
 */
void    cache_set_fds(fd_set *fdset);
int     cache_process_req(fd_set *readfds);
45
/*
 * Filehandle fsid encodings, as decoded by parse_fsid().  The numeric
 * value is the "fsidtype" field of an nfsd.fh request.
 */
enum nfsd_fsid {
        FSID_DEV = 0,           /* 8 bytes: packed major/minor, 4 byte inode */
        FSID_NUM,               /* 4 bytes: fsid number */
        FSID_MAJOR_MINOR,       /* 12 bytes: 4 major, 4 minor, 4 inode */
        FSID_ENCODE_DEV,        /* 8 bytes: 4 byte packed device, 4 byte inode */
        FSID_UUID4_INUM,        /* 8 bytes: 4 byte inode, 4 byte uuid */
        FSID_UUID8,             /* 8 byte uuid */
        FSID_UUID16,            /* 16 byte uuid */
        FSID_UUID16_INUM,       /* 24 bytes: 8 byte inode, 16 byte uuid */
};
56
/*
 * Support routines for text-based upcalls.
 * Fields are separated by spaces.
 * Each field is either mangled so that space, tab, newline and backslash
 * are quoted with a backslash, or is hexified with a leading \x.
 * Each record is terminated with a newline.
 */
/* Forward declaration; nfsd_fh() treats a negative return as failure. */
static int cache_export_ent(char *domain, struct exportent *exp, char *p);

/* Initial capacity, in gid_t entries, of the group list used by auth_unix_gid(). */
#define INITIAL_MANAGED_GROUPS 100

/* Request line buffer and its size, shared by the upcall handlers via readline(). */
char *lbuf  = NULL;
int lbuflen = 0;
/* Defined elsewhere; when non-zero, auth_unix_ip() does not resolve a client name. */
extern int use_ipaddr;
72
73 static void auth_unix_ip(FILE *f)
74 {
75         /* requests are
76          *  class IP-ADDR
77          * Ignore if class != "nfsd"
78          * Otherwise find domainname and write back:
79          *
80          *  "nfsd" IP-ADDR expiry domainname
81          */
82         char *cp;
83         char class[20];
84         char ipaddr[INET6_ADDRSTRLEN];
85         char *client = NULL;
86         struct addrinfo *tmp = NULL;
87         struct addrinfo *ai = NULL;
88         if (readline(fileno(f), &lbuf, &lbuflen) != 1)
89                 return;
90
91         xlog(D_CALL, "auth_unix_ip: inbuf '%s'", lbuf);
92
93         cp = lbuf;
94
95         if (qword_get(&cp, class, 20) <= 0 ||
96             strcmp(class, "nfsd") != 0)
97                 return;
98
99         if (qword_get(&cp, ipaddr, sizeof(ipaddr)) <= 0)
100                 return;
101
102         tmp = host_pton(ipaddr);
103         if (tmp == NULL)
104                 return;
105
106         auth_reload();
107
108         /* addr is a valid, interesting address, find the domain name... */
109         if (!use_ipaddr) {
110                 ai = client_resolve(tmp->ai_addr);
111                 client = client_compose(ai);
112                 freeaddrinfo(ai);
113         }
114         freeaddrinfo(tmp);
115
116         qword_print(f, "nfsd");
117         qword_print(f, ipaddr);
118         qword_printuint(f, time(0) + DEFAULT_TTL);
119         if (use_ipaddr)
120                 qword_print(f, ipaddr);
121         else if (client)
122                 qword_print(f, *client?client:"DEFAULT");
123         qword_eol(f);
124         xlog(D_CALL, "auth_unix_ip: client %p '%s'", client, client?client: "DEFAULT");
125
126         free(client);
127 }
128
129 static void auth_unix_gid(FILE *f)
130 {
131         /* Request are
132          *  uid
133          * reply is
134          *  uid expiry count list of group ids
135          */
136         uid_t uid;
137         struct passwd *pw;
138         static gid_t *groups = NULL;
139         static int groups_len = 0;
140         gid_t *more_groups;
141         int ngroups;
142         int rv, i;
143         char *cp;
144
145         if (groups_len == 0) {
146                 groups = malloc(sizeof(gid_t) * INITIAL_MANAGED_GROUPS);
147                 if (!groups)
148                         return;
149
150                 groups_len = INITIAL_MANAGED_GROUPS;
151         }
152
153         ngroups = groups_len;
154
155         if (readline(fileno(f), &lbuf, &lbuflen) != 1)
156                 return;
157
158         cp = lbuf;
159         if (qword_get_uint(&cp, &uid) != 0)
160                 return;
161
162         pw = getpwuid(uid);
163         if (!pw)
164                 rv = -1;
165         else {
166                 rv = getgrouplist(pw->pw_name, pw->pw_gid, groups, &ngroups);
167                 if (rv == -1 && ngroups >= groups_len) {
168                         more_groups = realloc(groups, sizeof(gid_t)*ngroups);
169                         if (!more_groups)
170                                 rv = -1;
171                         else {
172                                 groups = more_groups;
173                                 groups_len = ngroups;
174                                 rv = getgrouplist(pw->pw_name, pw->pw_gid,
175                                                   groups, &ngroups);
176                         }
177                 }
178         }
179         qword_printuint(f, uid);
180         qword_printuint(f, time(0) + DEFAULT_TTL);
181         if (rv >= 0) {
182                 qword_printuint(f, ngroups);
183                 for (i=0; i<ngroups; i++)
184                         qword_printuint(f, groups[i]);
185         } else
186                 qword_printuint(f, 0);
187         qword_eol(f);
188 }
189
#if USE_BLKID
/*
 * Look up the blkid "UUID" tag of the device holding 'path'.
 *
 * Returns the tag value as handed out by the blkid tag iterator, or
 * NULL when the path cannot be stat'ed, the device is unknown to
 * blkid, no UUID tag is seen, or a TYPE tag of "btrfs" is seen
 * (iteration stops there).
 * The blkid cache handle is created on first use and kept for later
 * calls.
 */
static const char *get_uuid_blkdev(char *path)
{
        static blkid_cache cache = NULL;
        struct stat stb;
        char *devname;
        blkid_dev dev;
        blkid_tag_iterate iter;
        const char *tag;
        const char *value;
        const char *uuid = NULL;

        if (cache == NULL)
                blkid_get_cache(&cache, NULL);

        if (stat(path, &stb) != 0)
                return NULL;

        devname = blkid_devno_to_devname(stb.st_dev);
        if (devname == NULL)
                return NULL;

        dev = blkid_get_dev(cache, devname, BLKID_DEV_NORMAL);
        free(devname);
        if (dev == NULL)
                return NULL;

        iter = blkid_tag_iterate_begin(dev);
        if (iter == NULL)
                return NULL;

        for (;;) {
                if (blkid_tag_next(iter, &tag, &value) != 0)
                        break;
                if (strcmp(tag, "UUID") == 0)
                        uuid = value;
                if (strcmp(tag, "TYPE") == 0 &&
                    strcmp(value, "btrfs") == 0) {
                        /* btrfs: report no blkid uuid at all */
                        uuid = NULL;
                        break;
                }
        }
        blkid_tag_iterate_end(iter);

        return uuid;
}
#else
/* Built without blkid support: there is never a blkid uuid. */
#define get_uuid_blkdev(path) (NULL)
#endif
234
/*
 * Extract the hex digits from 'val' and compose a uuid of 'uuidlen'
 * bytes in 'u'.  Non-hex characters (e.g. the dashes of a textual
 * uuid) are skipped.  When 'val' holds more than 2*uuidlen digits the
 * extra digits wrap around and are xor-ed into the bytes already
 * written, folding a long uuid into a shorter one.
 *
 * 'u' must have room for 'uuidlen' bytes.  Always returns 1; nothing
 * is written when 'uuidlen' is not positive.
 */
static int get_uuid(const char *val, int uuidlen, char *u)
{
        int i = 0;

        if (uuidlen <= 0)
                return 1;

        memset(u, 0, uuidlen);
        for ( ; *val ; val++) {
                /* <ctype.h> functions need a value in unsigned char range */
                unsigned char c = (unsigned char)*val;
                unsigned char nibble;

                if (!isxdigit(c))
                        continue;
                if (isdigit(c))
                        nibble = c - '0';
                else if (isupper(c))
                        nibble = c - 'A' + 10;
                else
                        nibble = c - 'a' + 10;

                /* even positions fill the high half of the byte */
                if ((i & 1) == 0)
                        nibble <<= 4;
                u[i/2] ^= nibble;
                i++;
                if (i == uuidlen*2)
                        i = 0;
        }
        return 1;
}
264
265 static int uuid_by_path(char *path, int type, int uuidlen, char *uuid)
266 {
267         /* get a uuid for the filesystem found at 'path'.
268          * There are several possible ways of generating the
269          * uuids (types).
270          * Type 0 is used for new filehandles, while other types
271          * may be used to interpret old filehandle - to ensure smooth
272          * forward migration.
273          * We return 1 if a uuid was found (and it might be worth 
274          * trying the next type) or 0 if no more uuid types can be
275          * extracted.
276          */
277
278         /* Possible sources of uuid are
279          * - blkid uuid
280          * - statfs64 uuid
281          *
282          * On some filesystems (e.g. vfat) the statfs64 uuid is simply an
283          * encoding of the device that the filesystem is mounted from, so
284          * it we be very bad to use that (as device numbers change).  blkid
285          * must be preferred.
286          * On other filesystems (e.g. btrfs) the statfs64 uuid contains
287          * important info that the blkid uuid cannot contain:  This happens
288          * when multiple subvolumes are exported (they have the same
289          * blkid uuid but different statfs64 uuids).
290          * We rely on get_uuid_blkdev *knowing* which is which and not returning
291          * a uuid for filesystems where the statfs64 uuid is better.
292          *
293          */
294         struct statfs64 st;
295         char fsid_val[17];
296         const char *blkid_val;
297         const char *val;
298
299         blkid_val = get_uuid_blkdev(path);
300
301         if (statfs64(path, &st) == 0 &&
302             (st.f_fsid.__val[0] || st.f_fsid.__val[1]))
303                 snprintf(fsid_val, 17, "%08x%08x",
304                          st.f_fsid.__val[0], st.f_fsid.__val[1]);
305         else
306                 fsid_val[0] = 0;
307
308         if (blkid_val && (type--) == 0)
309                 val = blkid_val;
310         else if (fsid_val[0] && (type--) == 0)
311                 val = fsid_val;
312         else
313                 return 0;
314
315         get_uuid(val, uuidlen, uuid);
316         return 1;
317 }
318
/*
 * Iterate through /etc/mtab, returning mount points strictly below
 * the path 'p' (the entry must continue with '/' right after 'p').
 *
 * '*v' is the iteration state: pass a pointer to a NULL-initialised
 * void * on the first call and the same pointer on later calls.
 * Returns the next matching mount directory, or NULL when the table is
 * exhausted or cannot be opened; in both cases '*v' is NULL again and
 * nothing is left open.  The returned string is the mnt_dir field of
 * the entry returned by getmntent().
 */
static char *next_mnt(void **v, char *p)
{
        FILE *f;
        struct mntent *me;
        size_t l = strlen(p);

        if (*v == NULL) {
                f = setmntent("/etc/mtab", "r");
                /* no mount table: behave as if it had no entries */
                if (f == NULL)
                        return NULL;
                *v = f;
        } else
                f = *v;

        while ((me = getmntent(f)) != NULL &&
               (strncmp(me->mnt_dir, p, l) != 0 ||
                me->mnt_dir[l] != '/'))
                ;
        if (me == NULL) {
                endmntent(f);
                *v = NULL;
                return NULL;
        }
        return me->mnt_dir;
}
343
344 /* True iff e1 is a child of e2 and e2 has crossmnt set: */
345 static bool subexport(struct exportent *e1, struct exportent *e2)
346 {
347         char *p1 = e1->e_path, *p2 = e2->e_path;
348         int l2 = strlen(p2);
349
350         return e2->e_flags & NFSEXP_CROSSMOUNT
351                && strncmp(p1, p2, l2) == 0
352                && p1[l2] == '/';
353 }
354
/*
 * Decoded form of a filehandle fsid, filled in by parse_fsid().
 * Which members are meaningful depends on fsidtype.
 */
struct parsed_fsid {
        int fsidtype;           /* one of enum nfsd_fsid */
        /* We could use a union for this, but it would be more
         * complicated; why bother? */
        unsigned int inode;     /* inode number (types that carry one) */
        unsigned int minor;     /* device minor (device based types) */
        unsigned int major;     /* device major (device based types) */
        unsigned int fsidnum;   /* fsid number (FSID_NUM) */
        int uuidlen;            /* number of bytes at fhuuid (uuid types) */
        char *fhuuid;           /* uuid bytes; points into the buffer given to parse_fsid() */
};
366
367 int parse_fsid(int fsidtype, int fsidlen, char *fsid, struct parsed_fsid *parsed)
368 {
369         unsigned int dev;
370         unsigned long long inode64;
371
372         parsed->fsidtype = fsidtype;
373         switch(fsidtype) {
374         case FSID_DEV: /* 4 bytes: 2 major, 2 minor, 4 inode */
375                 if (fsidlen != 8)
376                         return -1;
377                 memcpy(&dev, fsid, 4);
378                 memcpy(&parsed->inode, fsid+4, 4);
379                 parsed->major = ntohl(dev)>>16;
380                 parsed->minor = ntohl(dev) & 0xFFFF;
381                 break;
382
383         case FSID_NUM: /* 4 bytes - fsid */
384                 if (fsidlen != 4)
385                         return -1;
386                 memcpy(&parsed->fsidnum, fsid, 4);
387                 break;
388
389         case FSID_MAJOR_MINOR: /* 12 bytes: 4 major, 4 minor, 4 inode 
390                  * This format is never actually used but was
391                  * an historical accident
392                  */
393                 if (fsidlen != 12)
394                         return -1;
395                 memcpy(&dev, fsid, 4);
396                 parsed->major = ntohl(dev);
397                 memcpy(&dev, fsid+4, 4);
398                 parsed->minor = ntohl(dev);
399                 memcpy(&parsed->inode, fsid+8, 4);
400                 break;
401
402         case FSID_ENCODE_DEV: /* 8 bytes: 4 byte packed device number, 4 inode */
403                 /* This is *host* endian, not net-byte-order, because
404                  * no-one outside this host has any business interpreting it
405                  */
406                 if (fsidlen != 8)
407                         return -1;
408                 memcpy(&dev, fsid, 4);
409                 memcpy(&parsed->inode, fsid+4, 4);
410                 parsed->major = (dev & 0xfff00) >> 8;
411                 parsed->minor = (dev & 0xff) | ((dev >> 12) & 0xfff00);
412                 break;
413
414         case FSID_UUID4_INUM: /* 4 byte inode number and 4 byte uuid */
415                 if (fsidlen != 8)
416                         return -1;
417                 memcpy(&parsed->inode, fsid, 4);
418                 parsed->uuidlen = 4;
419                 parsed->fhuuid = fsid+4;
420                 break;
421         case FSID_UUID8: /* 8 byte uuid */
422                 if (fsidlen != 8)
423                         return -1;
424                 parsed->uuidlen = 8;
425                 parsed->fhuuid = fsid;
426                 break;
427         case FSID_UUID16: /* 16 byte uuid */
428                 if (fsidlen != 16)
429                         return -1;
430                 parsed->uuidlen = 16;
431                 parsed->fhuuid = fsid;
432                 break;
433         case FSID_UUID16_INUM: /* 8 byte inode number and 16 byte uuid */
434                 if (fsidlen != 24)
435                         return -1;
436                 memcpy(&inode64, fsid, 8);
437                 parsed->inode = inode64;
438                 parsed->uuidlen = 16;
439                 parsed->fhuuid = fsid+8;
440                 break;
441         }
442         return 0;
443 }
444
445 static bool match_fsid(struct parsed_fsid *parsed, nfs_export *exp, char *path)
446 {
447         struct stat stb;
448         int type;
449         char u[16];
450
451         if (stat(path, &stb) != 0)
452                 return false;
453         if (!S_ISDIR(stb.st_mode) && !S_ISREG(stb.st_mode))
454                 return false;
455
456         switch (parsed->fsidtype) {
457         case FSID_DEV:
458         case FSID_MAJOR_MINOR:
459         case FSID_ENCODE_DEV:
460                 if (stb.st_ino != parsed->inode)
461                         return false;
462                 if (parsed->major != major(stb.st_dev) ||
463                     parsed->minor != minor(stb.st_dev))
464                         return false;
465                 return true;
466         case FSID_NUM:
467                 if (((exp->m_export.e_flags & NFSEXP_FSID) == 0 ||
468                      exp->m_export.e_fsid != parsed->fsidnum))
469                         return false;
470                 return true;
471         case FSID_UUID4_INUM:
472         case FSID_UUID16_INUM:
473                 if (stb.st_ino != parsed->inode)
474                         return false;
475                 goto check_uuid;
476         case FSID_UUID8:
477         case FSID_UUID16:
478                 if (!is_mountpoint(path))
479                         return false;
480         check_uuid:
481                 if (exp->m_export.e_uuid)
482                         get_uuid(exp->m_export.e_uuid, parsed->uuidlen, u);
483                 else
484                         for (type = 0;
485                              uuid_by_path(path, type, parsed->uuidlen, u);
486                              type++)
487                                 if (memcmp(u, parsed->fhuuid, parsed->uuidlen) == 0)
488                                         return true;
489
490                 if (memcmp(u, parsed->fhuuid, parsed->uuidlen) != 0)
491                         return false;
492                 return true;
493         }
494         /* Well, unreachable, actually: */
495         return false;
496 }
497
498 struct addrinfo *lookup_client_addr(char *dom)
499 {
500         struct addrinfo *ret;
501         struct addrinfo *tmp;
502
503         dom++; /* skip initial "$" */
504
505         tmp = host_pton(dom);
506         if (tmp == NULL)
507                 return NULL;
508         ret = client_resolve(tmp->ai_addr);
509         freeaddrinfo(tmp);
510         return ret;
511 }
512
513 static void nfsd_fh(FILE *f)
514 {
515         /* request are:
516          *  domain fsidtype fsid
517          * interpret fsid, find export point and options, and write:
518          *  domain fsidtype fsid expiry path
519          */
520         char *cp;
521         char *dom;
522         int fsidtype;
523         int fsidlen;
524         char fsid[32];
525         struct parsed_fsid parsed;
526         struct exportent *found = NULL;
527         struct addrinfo *ai = NULL;
528         char *found_path = NULL;
529         nfs_export *exp;
530         int i;
531         int dev_missing = 0;
532
533         if (readline(fileno(f), &lbuf, &lbuflen) != 1)
534                 return;
535
536         xlog(D_CALL, "nfsd_fh: inbuf '%s'", lbuf);
537
538         cp = lbuf;
539
540         dom = malloc(strlen(cp));
541         if (dom == NULL)
542                 return;
543         if (qword_get(&cp, dom, strlen(cp)) <= 0)
544                 goto out;
545         if (qword_get_int(&cp, &fsidtype) != 0)
546                 goto out;
547         if (fsidtype < 0 || fsidtype > 7)
548                 goto out; /* unknown type */
549         if ((fsidlen = qword_get(&cp, fsid, 32)) <= 0)
550                 goto out;
551         if (parse_fsid(fsidtype, fsidlen, fsid, &parsed))
552                 goto out;
553
554         auth_reload();
555
556         if (is_ipaddr_client(dom)) {
557                 ai = lookup_client_addr(dom);
558                 if (!ai)
559                         goto out;
560         }
561
562         /* Now determine export point for this fsid/domain */
563         for (i=0 ; i < MCL_MAXTYPES; i++) {
564                 nfs_export *next_exp;
565                 for (exp = exportlist[i].p_head; exp; exp = next_exp) {
566                         char *path;
567
568                         if (exp->m_export.e_flags & NFSEXP_CROSSMOUNT) {
569                                 static nfs_export *prev = NULL;
570                                 static void *mnt = NULL;
571                                 
572                                 if (prev == exp) {
573                                         /* try a submount */
574                                         path = next_mnt(&mnt, exp->m_export.e_path);
575                                         if (!path) {
576                                                 next_exp = exp->m_next;
577                                                 prev = NULL;
578                                                 continue;
579                                         }
580                                         next_exp = exp;
581                                 } else {
582                                         prev = exp;
583                                         mnt = NULL;
584                                         path = exp->m_export.e_path;
585                                         next_exp = exp;
586                                 }
587                         } else {
588                                 path = exp->m_export.e_path;
589                                 next_exp = exp->m_next;
590                         }
591
592                         if (!is_ipaddr_client(dom)
593                                         && !namelist_client_matches(exp, dom))
594                                 continue;
595                         if (exp->m_export.e_mountpoint &&
596                             !is_mountpoint(exp->m_export.e_mountpoint[0]?
597                                            exp->m_export.e_mountpoint:
598                                            exp->m_export.e_path))
599                                 dev_missing ++;
600
601                         if (!match_fsid(&parsed, exp, path))
602                                 continue;
603                         if (is_ipaddr_client(dom)
604                                         && !ipaddr_client_matches(exp, ai))
605                                 continue;
606                         if (!found || subexport(&exp->m_export, found)) {
607                                 found = &exp->m_export;
608                                 free(found_path);
609                                 found_path = strdup(path);
610                                 if (found_path == NULL)
611                                         goto out;
612                         } else if (strcmp(found->e_path, exp->m_export.e_path) != 0
613                                    && !subexport(found, &exp->m_export))
614                         {
615                                 xlog(L_WARNING, "%s and %s have same filehandle for %s, using first",
616                                      found_path, path, dom);
617                         } else {
618                                 /* same path, if one is V4ROOT, choose the other */
619                                 if (found->e_flags & NFSEXP_V4ROOT) {
620                                         found = &exp->m_export;
621                                         free(found_path);
622                                         found_path = strdup(path);
623                                         if (found_path == NULL)
624                                                 goto out;
625                                 }
626                         }
627                 }
628         }
629         if (found && 
630             found->e_mountpoint &&
631             !is_mountpoint(found->e_mountpoint[0]?
632                            found->e_mountpoint:
633                            found->e_path)) {
634                 /* Cannot export this yet 
635                  * should log a warning, but need to rate limit
636                    xlog(L_WARNING, "%s not exported as %d not a mountpoint",
637                    found->e_path, found->e_mountpoint);
638                  */
639                 /* FIXME we need to make sure we re-visit this later */
640                 goto out;
641         }
642         if (!found && dev_missing) {
643                 /* The missing dev could be what we want, so just be
644                  * quite rather than returning stale yet
645                  */
646                 goto out;
647         }
648
649         if (found)
650                 if (cache_export_ent(dom, found, found_path) < 0)
651                         found = 0;
652
653         qword_print(f, dom);
654         qword_printint(f, fsidtype);
655         qword_printhex(f, fsid, fsidlen);
656         /* The fsid -> path lookup can be quite expensive as it
657          * potentially stats and reads lots of devices, and some of those
658          * might have spun-down.  The Answer is not likely to
659          * change underneath us, and an 'exportfs -f' can always
660          * remove this from the kernel, so use a really log
661          * timeout.  Maybe this should be configurable on the command
662          * line.
663          */
664         qword_printint(f, 0x7fffffff);
665         if (found)
666                 qword_print(f, found_path);
667         qword_eol(f);
668  out:
669         if (found_path)
670                 free(found_path);
671         freeaddrinfo(ai);
672         free(dom);
673         xlog(D_CALL, "nfsd_fh: found %p path %s", found, found ? found->e_path : NULL);
674         return;         
675 }
676
677 static void write_fsloc(FILE *f, struct exportent *ep)
678 {
679         struct servers *servers;
680
681         if (ep->e_fslocmethod == FSLOC_NONE)
682                 return;
683
684         servers = replicas_lookup(ep->e_fslocmethod, ep->e_fslocdata);
685         if (!servers)
686                 return;
687         qword_print(f, "fsloc");
688         qword_printint(f, servers->h_num);
689         if (servers->h_num >= 0) {
690                 int i;
691                 for (i=0; i<servers->h_num; i++) {
692                         qword_print(f, servers->h_mp[i]->h_host);
693                         qword_print(f, servers->h_mp[i]->h_path);
694                 }
695         }
696         qword_printint(f, servers->h_referral);
697         release_replicas(servers);
698 }
699
700 static void write_secinfo(FILE *f, struct exportent *ep, int flag_mask)
701 {
702         struct sec_entry *p;
703
704         for (p = ep->e_secinfo; p->flav; p++)
705                 ; /* Do nothing */
706         if (p == ep->e_secinfo) {
707                 /* There was no sec= option */
708                 return;
709         }
710         qword_print(f, "secinfo");
711         qword_printint(f, p - ep->e_secinfo);
712         for (p = ep->e_secinfo; p->flav; p++) {
713                 qword_printint(f, p->flav->fnum);
714                 qword_printint(f, p->flags & flag_mask);
715         }
716
717 }
718
719 static int dump_to_cache(FILE *f, char *domain, char *path, struct exportent *exp)
720 {
721         qword_print(f, domain);
722         qword_print(f, path);
723         if (exp) {
724                 int different_fs = strcmp(path, exp->e_path) != 0;
725                 int flag_mask = different_fs ? ~NFSEXP_FSID : ~0;
726
727                 qword_printuint(f, time(0) + exp->e_ttl);
728                 qword_printint(f, exp->e_flags & flag_mask);
729                 qword_printint(f, exp->e_anonuid);
730                 qword_printint(f, exp->e_anongid);
731                 qword_printint(f, exp->e_fsid);
732                 write_fsloc(f, exp);
733                 write_secinfo(f, exp, flag_mask);
734                 if (exp->e_uuid == NULL || different_fs) {
735                         char u[16];
736                         if (uuid_by_path(path, 0, 16, u)) {
737                                 qword_print(f, "uuid");
738                                 qword_printhex(f, u, 16);
739                         }
740                 } else {
741                         char u[16];
742                         get_uuid(exp->e_uuid, 16, u);
743                         qword_print(f, "uuid");
744                         qword_printhex(f, u, 16);
745                 }
746         } else
747                 qword_printuint(f, time(0) + DEFAULT_TTL);
748         return qword_eol(f);
749 }
750
/*
 * Return non-zero iff 'child' is the same path as 'parent' or lies
 * below it, i.e. 'parent' is a prefix of 'child' that ends on a path
 * component boundary.
 *
 * A parent that itself ends in '/' (notably the root "/") already
 * ends on a boundary, so any path it prefixes is below it; looking
 * for a further '/' right after the prefix would wrongly reject
 * "/foo" as a descendant of "/".
 */
static int is_subdirectory(char *child, char *parent)
{
        size_t l = strlen(parent);

        if (strcmp(child, parent) == 0)
                return 1;
        if (strncmp(child, parent, l) != 0)
                return 0;
        if (l > 0 && parent[l - 1] == '/')
                return 1;
        return child[l] == '/';
}
758
759 static int path_matches(nfs_export *exp, char *path)
760 {
761         if (exp->m_export.e_flags & NFSEXP_CROSSMOUNT)
762                 return is_subdirectory(path, exp->m_export.e_path);
763         return strcmp(path, exp->m_export.e_path) == 0;
764 }
765
766 static int
767 export_matches(nfs_export *exp, char *dom, char *path, struct addrinfo *ai)
768 {
769         return path_matches(exp, path) && client_matches(exp, dom, ai);
770 }
771
772 static nfs_export *
773 lookup_export(char *dom, char *path, struct addrinfo *ai)
774 {
775         nfs_export *exp;
776         nfs_export *found = NULL;
777         int found_type = 0;
778         int i;
779
780         for (i=0 ; i < MCL_MAXTYPES; i++) {
781                 for (exp = exportlist[i].p_head; exp; exp = exp->m_next) {
782                         if (!export_matches(exp, dom, path, ai))
783                                 continue;
784                         if (!found) {
785                                 found = exp;
786                                 found_type = i;
787                                 continue;
788                         }
789                         /* Always prefer non-V4ROOT exports */
790                         if (exp->m_export.e_flags & NFSEXP_V4ROOT)
791                                 continue;
792                         if (found->m_export.e_flags & NFSEXP_V4ROOT) {
793                                 found = exp;
794                                 found_type = i;
795                                 continue;
796                         }
797
798                         /* If one is a CROSSMOUNT, then prefer the longest path */
799                         if (((found->m_export.e_flags & NFSEXP_CROSSMOUNT) ||
800                              (exp->m_export.e_flags & NFSEXP_CROSSMOUNT)) &&
801                             strlen(found->m_export.e_path) !=
802                             strlen(exp->m_export.e_path)) {
803
804                                 if (strlen(exp->m_export.e_path) >
805                                     strlen(found->m_export.e_path)) {
806                                         found = exp;
807                                         found_type = i;
808                                 }
809                                 continue;
810
811                         } else if (found_type == i && found->m_warned == 0) {
812                                 xlog(L_WARNING, "%s exported to both %s and %s, "
813                                      "arbitrarily choosing options from first",
814                                      path, found->m_client->m_hostname, exp->m_client->m_hostname,
815                                      dom);
816                                 found->m_warned = 1;
817                         }
818                 }
819         }
820         return found;
821 }
822
823 #ifdef HAVE_NFS_PLUGIN_H
824 #include <dlfcn.h>
825 #include <nfs-plugin.h>
826
827 /*
828  * Walk through a set of FS locations and build a set of export options.
829  * Returns true if all went to plan; otherwise, false.
830  */
831 static _Bool
832 locations_to_options(struct jp_ops *ops, nfs_fsloc_set_t locations,
833                 char *options, size_t remaining, int *ttl)
834 {
835         char *server, *last_path, *rootpath, *ptr;
836         _Bool seen = false;
837
838         last_path = NULL;
839         rootpath = NULL;
840         server = NULL;
841         ptr = options;
842         *ttl = 0;
843
844         for (;;) {
845                 enum jp_status status;
846                 int len;
847
848                 status = ops->jp_get_next_location(locations, &server,
849                                                         &rootpath, ttl);
850                 if (status == JP_EMPTY)
851                         break;
852                 if (status != JP_OK) {
853                         xlog(D_GENERAL, "%s: failed to parse location: %s",
854                                 __func__, ops->jp_error(status));
855                         goto out_false;
856                 }
857                 xlog(D_GENERAL, "%s: Location: %s:%s",
858                         __func__, server, rootpath);
859
860                 if (last_path && strcmp(rootpath, last_path) == 0) {
861                         len = snprintf(ptr, remaining, "+%s", server);
862                         if (len < 0) {
863                                 xlog(D_GENERAL, "%s: snprintf: %m", __func__);
864                                 goto out_false;
865                         }
866                         if ((size_t)len >= remaining) {
867                                 xlog(D_GENERAL, "%s: options buffer overflow", __func__);
868                                 goto out_false;
869                         }
870                         remaining -= (size_t)len;
871                         ptr += len;
872                 } else {
873                         if (last_path == NULL)
874                                 len = snprintf(ptr, remaining, "refer=%s@%s",
875                                                         rootpath, server);
876                         else
877                                 len = snprintf(ptr, remaining, ":%s@%s",
878                                                         rootpath, server);
879                         if (len < 0) {
880                                 xlog(D_GENERAL, "%s: snprintf: %m", __func__);
881                                 goto out_false;
882                         }
883                         if ((size_t)len >= remaining) {
884                                 xlog(D_GENERAL, "%s: options buffer overflow",
885                                         __func__);
886                                 goto out_false;
887                         }
888                         remaining -= (size_t)len;
889                         ptr += len;
890                         last_path = rootpath;
891                 }
892
893                 seen = true;
894                 free(rootpath);
895                 free(server);
896         }
897
898         xlog(D_CALL, "%s: options='%s', ttl=%d",
899                 __func__, options, *ttl);
900         return seen;
901
902 out_false:
903         free(rootpath);
904         free(server);
905         return false;
906 }
907
908 /*
909  * Walk through the set of FS locations and build an exportent.
910  * Returns pointer to an exportent if "junction" refers to a junction.
911  *
912  * Returned exportent points to static memory.
913  */
914 static struct exportent *do_locations_to_export(struct jp_ops *ops,
915                 nfs_fsloc_set_t locations, const char *junction,
916                 char *options, size_t options_len)
917 {
918         struct exportent *exp;
919         int ttl;
920
921         if (!locations_to_options(ops, locations, options, options_len, &ttl))
922                 return NULL;
923
924         exp = mkexportent("*", (char *)junction, options);
925         if (exp == NULL) {
926                 xlog(L_ERROR, "%s: Failed to construct exportent", __func__);
927                 return NULL;
928         }
929
930         exp->e_uuid = NULL;
931         exp->e_ttl = ttl;
932         return exp;
933 }
934
935 /*
936  * Convert set of FS locations to an exportent.  Returns pointer to
937  * an exportent if "junction" refers to a junction.
938  *
939  * Returned exportent points to static memory.
940  */
941 static struct exportent *locations_to_export(struct jp_ops *ops,
942                 nfs_fsloc_set_t locations, const char *junction)
943 {
944         struct exportent *exp;
945         char *options;
946
947         options = malloc(BUFSIZ);
948         if (options == NULL) {
949                 xlog(D_GENERAL, "%s: failed to allocate options buffer",
950                         __func__);
951                 return NULL;
952         }
953         options[0] = '\0';
954
955         exp = do_locations_to_export(ops, locations, junction,
956                                                 options, BUFSIZ);
957
958         free(options);
959         return exp;
960 }
961
962 /*
963  * Retrieve locations information in "junction" and dump it to the
964  * kernel.  Returns pointer to an exportent if "junction" refers
965  * to a junction.
966  *
967  * Returned exportent points to static memory.
968  */
969 static struct exportent *invoke_junction_ops(void *handle,
970                 const char *junction)
971 {
972         nfs_fsloc_set_t locations;
973         struct exportent *exp;
974         enum jp_status status;
975         struct jp_ops *ops;
976         char *error;
977
978         ops = (struct jp_ops *)dlsym(handle, "nfs_junction_ops");
979         error = dlerror();
980         if (error != NULL) {
981                 xlog(D_GENERAL, "%s: dlsym(jp_junction_ops): %s",
982                         __func__, error);
983                 return NULL;
984         }
985         if (ops->jp_api_version != JP_API_VERSION) {
986                 xlog(D_GENERAL, "%s: unrecognized junction API version: %u",
987                         __func__, ops->jp_api_version);
988                 return NULL;
989         }
990
991         status = ops->jp_init(false);
992         if (status != JP_OK) {
993                 xlog(D_GENERAL, "%s: failed to resolve %s: %s",
994                         __func__, junction, ops->jp_error(status));
995                 return NULL;
996         }
997
998         status = ops->jp_get_locations(junction, &locations);
999         if (status != JP_OK) {
1000                 xlog(D_GENERAL, "%s: failed to resolve %s: %s",
1001                         __func__, junction, ops->jp_error(status));
1002                 return NULL;
1003         }
1004
1005         exp = locations_to_export(ops, locations, junction);
1006
1007         ops->jp_put_locations(locations);
1008         ops->jp_done();
1009         return exp;
1010 }
1011
1012 /*
1013  * Load the junction plug-in, then try to resolve "pathname".
1014  * Returns pointer to an initialized exportent if "junction"
1015  * refers to a junction, or NULL if not.
1016  *
1017  * Returned exportent points to static memory.
1018  */
1019 static struct exportent *lookup_junction(const char *pathname)
1020 {
1021         struct exportent *exp;
1022         void *handle;
1023
1024         handle = dlopen("libnfsjunct.so", RTLD_NOW);
1025         if (handle == NULL) {
1026                 xlog(D_GENERAL, "%s: dlopen: %s", __func__, dlerror());
1027                 return NULL;
1028         }
1029         (void)dlerror();        /* Clear any error */
1030
1031         exp = invoke_junction_ops(handle, pathname);
1032
1033         /* We could leave it loaded to make junction resolution
1034          * faster next time.  However, if we want to replace the
1035          * library, that would require restarting mountd. */
1036         (void)dlclose(handle);
1037         return exp;
1038 }
1039 #else   /* !HAVE_NFS_PLUGIN_H */
/*
 * Built without the junction plug-in header: no path is ever treated
 * as a junction, so the lookup always comes back empty.
 */
static inline struct exportent *lookup_junction(const char *UNUSED(pathname))
{
	return NULL;
}
1044 #endif  /* !HAVE_NFS_PLUGIN_H */
1045
1046 static void nfsd_export(FILE *f)
1047 {
1048         /* requests are:
1049          *  domain path
1050          * determine export options and return:
1051          *  domain path expiry flags anonuid anongid fsid
1052          */
1053
1054         char *cp;
1055         char *dom, *path;
1056         nfs_export *found = NULL;
1057         struct addrinfo *ai = NULL;
1058
1059         if (readline(fileno(f), &lbuf, &lbuflen) != 1)
1060                 return;
1061
1062         xlog(D_CALL, "nfsd_export: inbuf '%s'", lbuf);
1063
1064         cp = lbuf;
1065         dom = malloc(strlen(cp));
1066         path = malloc(strlen(cp));
1067
1068         if (!dom || !path)
1069                 goto out;
1070
1071         if (qword_get(&cp, dom, strlen(lbuf)) <= 0)
1072                 goto out;
1073         if (qword_get(&cp, path, strlen(lbuf)) <= 0)
1074                 goto out;
1075
1076         auth_reload();
1077
1078         if (is_ipaddr_client(dom)) {
1079                 ai = lookup_client_addr(dom);
1080                 if (!ai)
1081                         goto out;
1082         }
1083
1084         found = lookup_export(dom, path, ai);
1085
1086         if (found) {
1087                 if (dump_to_cache(f, dom, path, &found->m_export) < 0) {
1088                         xlog(L_WARNING,
1089                              "Cannot export %s, possibly unsupported filesystem"
1090                              " or fsid= required", path);
1091                         dump_to_cache(f, dom, path, NULL);
1092                 }
1093         } else {
1094                 dump_to_cache(f, dom, path, lookup_junction(path));
1095         }
1096  out:
1097         xlog(D_CALL, "nfsd_export: found %p path %s", found, path ? path : NULL);
1098         if (dom) free(dom);
1099         if (path) free(path);
1100         freeaddrinfo(ai);
1101 }
1102
1103
1104 struct {
1105         char *cache_name;
1106         void (*cache_handle)(FILE *f);
1107         FILE *f;
1108         char vbuf[RPC_CHAN_BUF_SIZE];
1109 } cachelist[] = {
1110         { "auth.unix.ip", auth_unix_ip, NULL, ""},
1111         { "auth.unix.gid", auth_unix_gid, NULL, ""},
1112         { "nfsd.export", nfsd_export, NULL, ""},
1113         { "nfsd.fh", nfsd_fh, NULL, ""},
1114         { NULL, NULL, NULL, ""}
1115 };
1116
1117 extern int manage_gids;
1118
1119 /**
1120  * cache_open - prepare communications channels with kernel RPC caches
1121  *
1122  */
1123 void cache_open(void) 
1124 {
1125         int i;
1126         for (i=0; cachelist[i].cache_name; i++ ) {
1127                 char path[100];
1128                 if (!manage_gids && cachelist[i].cache_handle == auth_unix_gid)
1129                         continue;
1130                 sprintf(path, "/proc/net/rpc/%s/channel", cachelist[i].cache_name);
1131                 cachelist[i].f = fopen(path, "r+");
1132                 if (cachelist[i].f != NULL) {
1133                         setvbuf(cachelist[i].f, cachelist[i].vbuf, _IOLBF, 
1134                                 RPC_CHAN_BUF_SIZE);
1135                 }
1136         }
1137 }
1138
1139 /**
1140  * cache_set_fds - prepare cache file descriptors for one iteration of the service loop
1141  * @fdset: pointer to fd_set to prepare
1142  */
1143 void cache_set_fds(fd_set *fdset)
1144 {
1145         int i;
1146         for (i=0; cachelist[i].cache_name; i++) {
1147                 if (cachelist[i].f)
1148                         FD_SET(fileno(cachelist[i].f), fdset);
1149         }
1150 }
1151
1152 /**
1153  * cache_process_req - process any active cache file descriptors during service loop iteration
1154  * @fdset: pointer to fd_set to examine for activity
1155  */
1156 int cache_process_req(fd_set *readfds) 
1157 {
1158         int i;
1159         int cnt = 0;
1160         for (i=0; cachelist[i].cache_name; i++) {
1161                 if (cachelist[i].f != NULL &&
1162                     FD_ISSET(fileno(cachelist[i].f), readfds)) {
1163                         cnt++;
1164                         cachelist[i].cache_handle(cachelist[i].f);
1165                         FD_CLR(fileno(cachelist[i].f), readfds);
1166                 }
1167         }
1168         return cnt;
1169 }
1170
1171
1172 /*
1173  * Give IP->domain and domain+path->options to kernel
1174  * % echo nfsd $IP  $[now+DEFAULT_TTL] $domain > /proc/net/rpc/auth.unix.ip/channel
1175  * % echo $domain $path $[now+DEFAULT_TTL] $options $anonuid $anongid $fsid > /proc/net/rpc/nfsd.export/channel
1176  */
1177
1178 static int cache_export_ent(char *domain, struct exportent *exp, char *path)
1179 {
1180         int err;
1181         FILE *f = fopen("/proc/net/rpc/nfsd.export/channel", "w");
1182         if (!f)
1183                 return -1;
1184
1185         err = dump_to_cache(f, domain, exp->e_path, exp);
1186         if (err) {
1187                 xlog(L_WARNING,
1188                      "Cannot export %s, possibly unsupported filesystem or"
1189                      " fsid= required", exp->e_path);
1190         }
1191
1192         while (err == 0 && (exp->e_flags & NFSEXP_CROSSMOUNT) && path) {
1193                 /* really an 'if', but we can break out of
1194                  * a 'while' more easily */
1195                 /* Look along 'path' for other filesystems
1196                  * and export them with the same options
1197                  */
1198                 struct stat stb;
1199                 size_t l = strlen(exp->e_path);
1200                 __dev_t dev;
1201
1202                 if (strlen(path) <= l || path[l] != '/' ||
1203                     strncmp(exp->e_path, path, l) != 0)
1204                         break;
1205                 if (stat(exp->e_path, &stb) != 0)
1206                         break;
1207                 dev = stb.st_dev;
1208                 while(path[l] == '/') {
1209                         char c;
1210                         /* errors for submount should fail whole filesystem */
1211                         int err2;
1212
1213                         l++;
1214                         while (path[l] != '/' && path[l])
1215                                 l++;
1216                         c = path[l];
1217                         path[l] = 0;
1218                         err2 = lstat(path, &stb);
1219                         path[l] = c;
1220                         if (err2 < 0)
1221                                 break;
1222                         if (stb.st_dev == dev)
1223                                 continue;
1224                         dev = stb.st_dev;
1225                         path[l] = 0;
1226                         dump_to_cache(f, domain, path, exp);
1227                         path[l] = c;
1228                 }
1229                 break;
1230         }
1231
1232         fclose(f);
1233         return err;
1234 }
1235
1236 /**
1237  * cache_export - Inform kernel of a new nfs_export
1238  * @exp: target nfs_export
1239  * @path: NUL-terminated C string containing export path
1240  */
1241 int cache_export(nfs_export *exp, char *path)
1242 {
1243         char buf[INET6_ADDRSTRLEN];
1244         int err;
1245         FILE *f;
1246
1247         f = fopen("/proc/net/rpc/auth.unix.ip/channel", "w");
1248         if (!f)
1249                 return -1;
1250
1251
1252         qword_print(f, "nfsd");
1253         qword_print(f,
1254                 host_ntop(get_addrlist(exp->m_client, 0), buf, sizeof(buf)));
1255         qword_printuint(f, time(0) + exp->m_export.e_ttl);
1256         qword_print(f, exp->m_client->m_hostname);
1257         err = qword_eol(f);
1258         
1259         fclose(f);
1260
1261         err = cache_export_ent(exp->m_client->m_hostname, &exp->m_export, path)
1262                 || err;
1263         return err;
1264 }
1265
1266 /**
1267  * cache_get_filehandle - given an nfs_export, get its root filehandle
1268  * @exp: target nfs_export
1269  * @len: length of requested file handle
1270  * @p: NUL-terminated C string containing export path
1271  *
1272  * Returns pointer to NFS file handle of root directory of export
1273  *
1274  * { 
1275  *   echo $domain $path $length 
1276  *   read filehandle <&0
1277  * } <> /proc/fs/nfsd/filehandle
1278  */
1279 struct nfs_fh_len *
1280 cache_get_filehandle(nfs_export *exp, int len, char *p)
1281 {
1282         FILE *f = fopen("/proc/fs/nfsd/filehandle", "r+");
1283         char buf[200];
1284         char *bp = buf;
1285         int failed;
1286         static struct nfs_fh_len fh;
1287
1288         if (!f)
1289                 f = fopen("/proc/fs/nfs/filehandle", "r+");
1290         if (!f)
1291                 return NULL;
1292
1293         qword_print(f, exp->m_client->m_hostname);
1294         qword_print(f, p);
1295         qword_printint(f, len); 
1296         failed = qword_eol(f);
1297         
1298         if (!failed)
1299                 failed = (fgets(buf, sizeof(buf), f) == NULL);
1300         fclose(f);
1301         if (failed)
1302                 return NULL;
1303         memset(fh.fh_handle, 0, sizeof(fh.fh_handle));
1304         fh.fh_size = qword_get(&bp, (char *)fh.fh_handle, NFS3_FHSIZE);
1305         return &fh;
1306 }