X-Git-Url: http://git.alex.org.uk diff --git a/nbd-server.c b/nbd-server.c index 3763d5a..5163fb3 100644 --- a/nbd-server.c +++ b/nbd-server.c @@ -3,6 +3,7 @@ * * Copyright 1996-1998 Pavel Machek, distribute under GPL * + * Copyright 2002 Anton Altaparmakov * * Version 1.0 - hopefully 64-bit-clean * Version 1.1 - merging enhancements from Josh Parsons, @@ -13,14 +14,42 @@ * with make FSCHOICE=-DFS_32BIT nbd-server. (I don't have the * original autoconf input file, or I would make it a configure * option.) Ken Yap . + * Version 1.6 - fix autodetection of block device size and really make 64 bit + * clean on 32 bit machines. Anton Altaparmakov + * Version 2.0 - Version synchronised with client + * Version 2.1 - Reap zombie client processes when they exit. Removed + * (uncommented) the _IO magic, it's no longer necessary. Wouter + * Verhelst + * Version 2.2 - Auto switch to read-only mode (usefull for floppies). + * Version 2.3 - Fixed code so that Large File Support works. This + * removes the FS_32BIT compile-time directive; define + * _FILE_OFFSET_BITS=64 and _LARGEFILE_SOURCE if you used to be + * using FS_32BIT. This will allow you to use files >2GB instead of + * having to use the -m option. Wouter Verhelst + * Version 2.4 - Added code to keep track of children, so that we can + * properly kill them from initscripts. Add a call to daemon(), + * so that processes don't think they have to wait for us, which is + * interesting for initscripts as well. Wouter Verhelst + * + * Version 2.5 - Bugfix release: forgot to reset child_arraysize to + * zero after fork()ing, resulting in nbd-server going berserk + * when it receives a signal with at least one child open. Wouter + * Verhelst + * 10/10/2003 - Added socket option SO_KEEPALIVE (sf.net bug 819235); + * rectified type of mainloop::size_host (sf.net bugs 814435 and + * 817385); close the PID file after writing to it, so that the + * daemon can actually be found. Wouter Verhelst + * */ -#define VERSION "1.5" +#define VERSION PACKAGE_VERSION #define GIGA (1*1024*1024*1024) #include #include #include +#include /* wait */ +#include /* sigaction */ #include #include /* sockaddr_in, htons, in_addr */ #include /* hostent, gethostby*, getservby* */ @@ -33,20 +62,19 @@ #include #include -#define _IO(a,b) +//#define _IO(a,b) // #define ISSERVER #define MY_NAME "nbd_server" -/* Authorization file should contain lines with IP addresses of - clients authorized to use the server. If it does not exist, - access is permitted. */ -#define AUTH_FILE "nbd_server.allow" +/* how much space for child PIDs we have by default. Dynamically + allocated, and will be realloc()ed if out of space, so this should + probably be fair for most situations. */ +#define DEFAULT_CHILD_ARRAY 256 #include "cliserv.h" -#undef _IO +//#undef _IO /* Deep magic: ioctl.h defines _IO macro (at least on linux) */ - /* Debugging macros, now nothing goes to syslog unless you say ISSERVER */ #ifdef ISSERVER #define msg2(a,b) syslog(a,b) @@ -58,19 +86,9 @@ #define msg4(a,b,c,d) do { fprintf(stderr,b,c,d); fputs("\n",stderr) ; } while(0) #endif - #include #include /* For BLKGETSIZE */ -#ifdef FS_32BIT -typedef u32 fsoffset_t; -#define htonll htonl -#define ntohll ntohl -#else -typedef u64 fsoffset_t; -#endif - - //#define DODBG #ifdef DODBG #define DEBUG( a ) printf( a ) @@ -82,39 +100,40 @@ typedef u64 fsoffset_t; #define DEBUG3( a,b,c ) #endif -#if defined(HAVE_LLSEEK) && !defined(sun) -/* Solaris already has llseek defined in unistd.h */ -extern long long llseek(unsigned int, long long, unsigned int); -#endif - -void serveconnection(int net) ; -void set_peername(int net,char *clientname) ; +void serveconnection(int net); +void set_peername(int net,char *clientname); #define LINELEN 256 -char difffilename[256] ; +char difffilename[256]; +unsigned int timeout = 0; +int autoreadonly = 0; +char *auth_file="nbd_server.allow"; int authorized_client(char *name) /* 0 - authorization refused, 1 - OK authorization file contains one line per machine, no wildcards */ -{ FILE *f ; +{ + FILE *f ; - char line[LINELEN] ; + char line[LINELEN] ; - if ((f=fopen(AUTH_FILE,"r"))==NULL) - { msg4(LOG_INFO,"Can't open authorization file %s (%s).", - AUTH_FILE,strerror(errno)) ; - return 1 ; - } + if ((f=fopen(auth_file,"r"))==NULL) { + msg4(LOG_INFO,"Can't open authorization file %s (%s).", + auth_file,strerror(errno)) ; + return 1 ; + } - while (fgets(line,LINELEN,f)!=NULL) { - if (strncmp(line,name,strlen(name))==0) { fclose(f) ; return 1 ; } - } - fclose(f) ; - return 0 ; + while (fgets(line,LINELEN,f)!=NULL) { + if (strncmp(line,name,strlen(name))==0) { + fclose(f); + return 1; + } + } + fclose(f) ; + return 0 ; } - inline void readit(int f, void *buf, int len) { int res; @@ -132,23 +151,31 @@ inline void writeit(int f, void *buf, int len) int res; while (len > 0) { DEBUG("+"); - if ((res = write(f, buf, len)) <= 0) - err("Write failed: %m"); + if ((res = send(f, buf, len, 0)) <= 0) + err("Send failed: %m"); len -= res; buf += res; } } +/* This is starting to get ugly. If someone knows a better way to find + * the maximum value of a signed type *without* relying on overflow + * (doing so breaks on 64bit architectures), that would be nice. + */ +#define OFFT_MAX (((((off_t)1)<<((sizeof(off_t)-1)*8))-1)<<7)+127 int port; /* Port I'm listening at */ char *exportname; /* File I'm exporting */ -fsoffset_t exportsize = ~0, hunksize = ~0; /* ...and its length */ +off_t exportsize = OFFT_MAX; /* ...and its length */ +off_t hunksize = OFFT_MAX; int flags = 0; int export[1024]; int difffile=-1 ; u32 difffilelen=0 ; /* number of pages in difffile */ u32 *difmap=NULL ; char clientname[256] ; - +int child_arraysize=DEFAULT_CHILD_ARRAY; +pid_t *children; +char pidfname[256]; #define DIFFPAGESIZE 4096 /* diff file uses those chunks */ @@ -162,10 +189,12 @@ void cmdline(int argc, char *argv[]) if (argc < 3) { printf("This is nbd-server version " VERSION "\n"); - printf("Usage: port file_to_export [size][kKmM] [-r] [-m] [-c]\n" + printf("Usage: port file_to_export [size][kKmM] [-r] [-m] [-c] [-a timeout_sec]\n" " -r read only\n" " -m multiple file\n" " -c copy on write\n" + " -l file with list of hosts that are allowed to connect.\n" + " -a maximum idle seconds, terminates when idle time exceeded\n" " if port is set to 0, stdin is used (for running from inetd)\n" " if file_to_export contains '%%s', it is substituted with IP\n" " address of machine trying to connect\n" ); @@ -182,17 +211,33 @@ void cmdline(int argc, char *argv[]) flags |= F_MULTIFILE; hunksize = 1*GIGA; break; - case 'c': flags |=F_COPYONWRITE ; - break ; + case 'c': flags |=F_COPYONWRITE; + break; + case 'l': + free(auth_file); + if (i+1 0) { + if(WIFEXITED(status)) { + msg3(LOG_INFO, "Child exited with %d", WEXITSTATUS(status)); + } + for(i=0;children[i]!=pid&&i=child_arraysize) { + msg3(LOG_INFO, "SIGCHLD received for an unknown child with PID %ld",(long) pid); + } else { + children[i]=(pid_t)0; + DEBUG2("Removing %d from the list of children", pid); + } + } +} + +/* If we are terminated, make sure our children are, too. */ +void sigterm_handler(int s) { + int i; + int parent=0; + + for(i=0;i0) { /* parent */ - close(net) ; continue ; } - /* child */ - close(sock) ; - msg2(LOG_INFO,"Starting to serve") ; - serveconnection(net) ; + if ((net = accept(sock, (struct sockaddr *) &addrin, &addrinlen)) < 0) + err("accept: %m"); + + set_peername(net,clientname) ; + if (!authorized_client(clientname)) { + msg2(LOG_INFO,"Unauthorized client") ; + close(net) ; + continue ; + } + msg2(LOG_INFO,"Authorized client") ; + for(i=0;children[i]&&i=child_arraysize) { + realloc(children, sizeof(pid_t)*child_arraysize); + memset(children+child_arraysize, 0, sizeof(pid_t)*DEFAULT_CHILD_ARRAY); + i=child_arraysize+1; + child_arraysize+=DEFAULT_CHILD_ARRAY; + } +#ifndef NOFORK + if ((children[i]=fork())<0) { + msg3(LOG_INFO,"Could not fork (%s)",strerror(errno)) ; + close(net) ; + continue ; + } + if (children[i]>0) { /* parent */ + close(net) ; continue ; } + /* child */ + realloc(children,0); + child_arraysize=0; + close(sock) ; +#endif // NOFORK + msg2(LOG_INFO,"Starting to serve") ; + serveconnection(net) ; } } #define SEND writeit( net, &reply, sizeof( reply )); #define ERROR { reply.error = htonl(-1); SEND; reply.error = 0; lastpoint = -1; } -fsoffset_t lastpoint = -1; +off_t lastpoint = (off_t)-1; -void maybeseek(int handle, fsoffset_t a) +void maybeseek(int handle, off_t a) { - if (a > exportsize) - err("Can not happen\n"); - if (lastpoint != a) { -#if defined(HAVE_LLSEEK) && !defined(FS_32BIT) - if (llseek(handle, a, SEEK_SET) < 0) -#else - if (lseek(handle, (long)a, SEEK_SET) < 0) -#endif - err("Can not seek locally!\n"); - lastpoint = a; - } else { - DEBUG("@"); - } +if (a > exportsize) + err("Can not happen\n"); +if (lastpoint != a) { + if (lseek(handle, a, SEEK_SET) < 0) + err("Can not seek locally!\n"); + lastpoint = a; +} else { + DEBUG("@"); +} } -void myseek(int handle,fsoffset_t a) +void myseek(int handle,off_t a) { -#if HAVE_LLSEEK && !defined(FS_32BIT) - if (llseek(handle, a, SEEK_SET) < 0) -#else - if (lseek(handle, (long)a, SEEK_SET) < 0) -#endif - err("Can not seek locally!\n"); + if (lseek(handle, a, SEEK_SET) < 0) + err("Can not seek locally!\n"); } -char pagebuf[DIFFPAGESIZE] ; +char pagebuf[DIFFPAGESIZE]; - -int rawexpread(fsoffset_t a, char *buf, int len) +int rawexpread(off_t a, char *buf, int len) { - maybeseek(export[a/hunksize], a%hunksize); - return (read(export[a/hunksize], buf, len) != len); + maybeseek(export[a/hunksize], a%hunksize); + return (read(export[a/hunksize], buf, len) != len); } -int expread(fsoffset_t a, char *buf, int len) -{ int rdlen ; fsoffset_t mapcnt,mapl,maph ; - fsoffset_t pagestart; int offset ; +int expread(off_t a, char *buf, int len) +{ + int rdlen, offset; + off_t mapcnt, mapl, maph, pagestart; - if (flags & F_COPYONWRITE) { - DEBUG3("Asked to read %d bytes at %lu.\n",len,(unsigned long)a) ; - - mapl=a/DIFFPAGESIZE ; maph=(a+len-1)/DIFFPAGESIZE ; - - for (mapcnt=mapl;mapcnt<=maph;mapcnt++) { - pagestart=mapcnt*DIFFPAGESIZE ; - offset=a-pagestart ; - rdlen=(lenhunksize) - rdlen=hunksize-(pagestart%hunksize) ; - if (rawexpread(pagestart,pagebuf,rdlen)) return -1 ; - memcpy(pagebuf+offset,buf,wrlen) ; - if (write(difffile,pagebuf,DIFFPAGESIZE)!=DIFFPAGESIZE) return -1 ; - } - len-=wrlen ; a+=wrlen ; buf+=wrlen ; - } - } else return(rawexpwrite(a,buf,len)); - return 0 ; +int expwrite(off_t a, char *buf, int len) +{ + u32 mapcnt,mapl,maph ; int wrlen,rdlen ; + off_t pagestart ; int offset ; + + if (!(flags & F_COPYONWRITE)) + return(rawexpwrite(a,buf,len)); + DEBUG3("Asked to write %d bytes at %Lu.\n", len, (unsigned long long)a); + + mapl=a/DIFFPAGESIZE ; maph=(a+len-1)/DIFFPAGESIZE ; + + for (mapcnt=mapl;mapcnt<=maph;mapcnt++) { + pagestart=mapcnt*DIFFPAGESIZE ; + offset=a-pagestart ; + wrlen=(lenhunksize) + rdlen=hunksize-(pagestart%hunksize) ; + if (rawexpread(pagestart,pagebuf,rdlen)) return -1 ; + memcpy(pagebuf+offset,buf,wrlen) ; + if (write(difffile,pagebuf,DIFFPAGESIZE)!=DIFFPAGESIZE) return -1 ; + } + len-=wrlen ; a+=wrlen ; buf+=wrlen ; + } + return 0; } int mainloop(int net) @@ -370,22 +506,16 @@ int mainloop(int net) struct nbd_reply reply; char zeros[300]; int i = 0; - fsoffset_t size_host; + u64 size_host; memset(zeros, 0, 290); if (write(net, INIT_PASSWD, 8) < 0) err("Negotiation failed: %m"); -#ifndef FS_32BIT cliserv_magic = htonll(cliserv_magic); -#endif if (write(net, &cliserv_magic, sizeof(cliserv_magic)) < 0) err("Negotiation failed: %m"); - size_host = htonll(exportsize); -#ifdef FS_32BIT - if (write(net, zeros, 4) < 0 || write(net, &size_host, 4) < 0) -#else + size_host = htonll((u64)exportsize); if (write(net, &size_host, 8) < 0) -#endif err("Negotiation failed: %m"); if (write(net, zeros, 128) < 0) err("Negotiation failed: %m"); @@ -397,12 +527,13 @@ int mainloop(int net) #define BUFSIZE (1024*1024) char buf[BUFSIZE]; int len; - #ifdef DODBG i++; printf("%d: ", i); #endif + if (timeout) + alarm(timeout); readit(net, &request, sizeof(request)); request.from = ntohll(request.from); request.type = ntohl(request.type); @@ -421,11 +552,17 @@ int mainloop(int net) if (len > BUFSIZE) err("Request too big!"); #ifdef DODBG - printf("%s from %d (%d) len %d, ", (request.type ? "WRITE" : "READ"), - (int) request.from, (int) request.from / 512, len); + printf("%s from %Lu (%Lu) len %d, ", request.type ? "WRITE" : + "READ", (unsigned long long)request.from, + (unsigned long long)request.from / 512, len); #endif memcpy(reply.handle, request.handle, sizeof(reply.handle)); - if (((request.from + len) > exportsize) || + if ((request.from + len) > (OFFT_MAX)) { + DEBUG("[Number too large!]"); + ERROR; + continue; + } + if ((((off_t)request.from + len) > exportsize) || ((flags & F_READONLY) && request.type)) { DEBUG("[RANGE!]"); ERROR; @@ -435,13 +572,14 @@ int mainloop(int net) DEBUG("wr: net->buf, "); readit(net, buf, len); DEBUG("buf->exp, "); - if (expwrite(request.from, buf, len)) { + if ((autoreadonly == 1) || expwrite(request.from, buf, len)) { DEBUG("Write failed: %m" ); ERROR; continue; } lastpoint += len; SEND; + DEBUG("OK!\n"); continue; } /* READ */ @@ -479,37 +617,45 @@ void set_peername(int net,char *clientname) strncpy(clientname,peername,255) ; } -fsoffset_t size_autodetect(int export) +off_t size_autodetect(int export) { - fsoffset_t es; + off_t es; + u32 es32; + struct stat stat_buf; + int error; + DEBUG("looking for export size with lseek SEEK_END\n"); - if ((int)(es = lseek(export, 0, SEEK_END)) == -1 || es == 0) { - struct stat stat_buf; - int error; - DEBUG("looking for export size with fstat\n"); - stat_buf.st_size = 0; - if ((error = fstat(export, &stat_buf)) == -1 || stat_buf.st_size == 0 ) { - DEBUG("looking for export size with ioctl BLKGETSIZE\n"); + es = lseek(export, (off_t)0, SEEK_END); + if (es > ((off_t)0)) { + return es; + } else { + DEBUG2("lseek failed: %d", errno==EBADF?1:(errno==ESPIPE?2:(errno==EINVAL?3:4))); + } + + DEBUG("looking for export size with fstat\n"); + stat_buf.st_size = 0; + error = fstat(export, &stat_buf); + if (!error && stat_buf.st_size > 0) { + return (off_t)stat_buf.st_size; + } else { + err("fstat failed: %m"); + } + #ifdef BLKGETSIZE - if(ioctl(export, BLKGETSIZE, &es) || es == 0) { -#else - if(1){ -#endif - err("Could not find size of exported block device: %m"); - } else { - es *= 512; /* assume blocksize 512 */ - } - } else { - es = stat_buf.st_size; - } + DEBUG("looking for export size with ioctl BLKGETSIZE\n"); + if (!ioctl(export, BLKGETSIZE, &es32) && es32) { + es = (off_t)es32 * (off_t)512; + return es; } - return es; +#endif + err("Could not find size of exported block device: %m"); + return OFFT_MAX; } int main(int argc, char *argv[]) { int net; - fsoffset_t i; + off_t i; if (sizeof( struct nbd_request )!=28) { fprintf(stderr,"Bad size of structure. Alignment problems?\n"); @@ -526,47 +672,44 @@ int main(int argc, char *argv[]) void serveconnection(int net) { - u64 i ; - - for (i=0; i (~0UL >> 1)) -#ifdef HAVE_LLSEEK - if ((exportsize >> 10) > (~0UL >> 1)) - msg3(LOG_INFO, "size of exported file/device is %luMB", - (unsigned long)(exportsize >> 20)); - else - msg3(LOG_INFO, "size of exported file/device is %luKB", - (unsigned long)(exportsize >> 10)); -#else - err("Size of exported file is too big\n"); -#endif - else - msg3(LOG_INFO, "size of exported file/device is %lu", - (unsigned long)exportsize); - - if (flags & F_COPYONWRITE) { - sprintf(difffilename,"%s-%s-%d.diff",exportname2,clientname, - (int)getpid()) ; - msg3(LOG_INFO,"About to create map and diff file %s",difffilename) ; - difffile=open(difffilename,O_RDWR | O_CREAT | O_TRUNC,0600) ; - if (difffile<0) err("Could not create diff file (%m)") ; - if ((difmap=calloc(exportsize/DIFFPAGESIZE,sizeof(u32)))==NULL) - err("Could not allocate memory") ; - for (i=0;i (off_t)OFFT_MAX) { + err("Size of exported file is too big\n"); + } + else + msg3(LOG_INFO, "size of exported file/device is %Lu", + (unsigned long long)exportsize); + + if (flags & F_COPYONWRITE) { + sprintf(difffilename,"%s-%s-%d.diff",exportname2,clientname, + (int)getpid()) ; + msg3(LOG_INFO,"About to create map and diff file %s",difffilename) ; + difffile=open(difffilename,O_RDWR | O_CREAT | O_TRUNC,0600) ; + if (difffile<0) err("Could not create diff file (%m)") ; + if ((difmap=calloc(exportsize/DIFFPAGESIZE,sizeof(u32)))==NULL) + err("Could not allocate memory") ; + for (i=0;i