2011-02-04 42 views
3

我遇到了以下问题(在 epoll_wait 之后调用 recv 时返回 EBADF):我有一段使用 epoll 接收连接的代码:

// Main event loop: waits on the epoll instance and handles every ready
// descriptor. Events on server_sock mean a new connection to accept; events on
// any other descriptor are hang-up / readable / error notifications for an
// already registered client socket.
while (1) { 
    // Third argument is the maximum number of events returned per call and -1
    // means "no timeout" (assumes `events` has room for 4096 entries — confirm
    // against its declaration).
    int nfds = epoll_wait(epollfd, events, 4096, -1); 
    if (nfds == -1) { 
     // A signal interrupted the wait: not a real failure, just wait again.
     if (errno == EINTR) 
      continue; 
     perror("epoll_wait"); 
     exit(EXIT_FAILURE); 
    } 

    for (int i = 0; i < nfds; i++) { 
     if (events[i].data.fd == server_sock) { 
      // Listening socket is ready: accept the pending connection.
      client_sock = accept(server_sock, 
         (struct sockaddr *)&client_name, 
         (socklen_t *)(&client_name_len)); 

     // accept() failed: skip this event and move on to the next one.
     if (client_sock == -1) //server overloaded 
      continue; 

     // Build the event mask the new client socket is registered with.
     ev.events = EPOLLIN | EPOLLERR; 

#ifdef CORE_NONBLOCKING_SOCKETS 
     Arch::set_nonblocking(client_sock); 
     ev.events |= EPOLLET; //input data and connection closing 
#endif 


#ifdef EPOLLRDHUP 
     ev.events |= EPOLLRDHUP ;// also request hang-up notification via EPOLLRDHUP when the headers define it
#else 
     //for old libraries 
     ev.events |= EPOLLHUP;// fallback hang-up flag when EPOLLRDHUP is not defined
#endif 

     // The descriptor is stored in the event so the handlers below can read
     // it back from events[i].data.fd.
     ev.data.fd = client_sock; 

     if (epoll_ctl(epollfd, EPOLL_CTL_ADD, client_sock, &ev) == -1) { 
      perror("epoll_ctl: client_socket"); 
      exit(EXIT_FAILURE); 
     } 

     // Hand the freshly accepted socket to accept_request() right away,
     // without waiting for a first EPOLLIN event.
     accept_request(client_sock); 

     } else { 

      // NOTE(review): the checks below are independent `if`s, so one event
      // mask that carries both a hang-up flag and EPOLLIN runs
      // disconnectDriver() and then still calls accept_request() on the same
      // descriptor. If disconnectDriver() closes the fd (not visible here —
      // confirm), the later read in accept_request() operates on a closed
      // descriptor.
#ifdef EPOLLRDHUP 
      if (events[i].events & EPOLLRDHUP) { 
       std::cout << "EPOLLRDHUP on " << events[i].data.fd << std::endl; 
       listener->disconnectDriver(events[i].data.fd); 
      } 
#else 
      if (events[i].events & EPOLLHUP) { 
       std::cout << "EPOLLHUP on " << events[i].data.fd << std::endl; 
       listener->disconnectDriver(events[i].data.fd); 
      } 
#endif 
      // Readable data on a client socket: let accept_request() process it.
      if (events[i].events & EPOLLIN) { 
       std::cout << "debug EPOLLIN on " << events[i].data.fd << std::endl; 
       accept_request(events[i].data.fd); 
      } 

      // Error condition reported for the descriptor: drop the client.
      if (events[i].events & EPOLLERR) { 
       std::cout << "debug EPOLLERR on " << events[i].data.fd << std::endl; 
       listener->disconnectDriver(events[i].data.fd); 
      } 


     } 
    } 

当我收到输入事件时,我想读取缓冲区中的所有数据:

/**
 * Reads one packet from a socket into inStr.
 *
 * Data is received until the text "</packet>" shows up in the buffer, the peer
 * closes the connection, recv() fails, or the buffer is full. Whatever was
 * received up to that point is stored in inStr as a C string (i.e. up to the
 * first NUL byte).
 *
 * When CORE_NONBLOCKING_SOCKETS is defined, a recv() that would block is
 * retried every 10 ms; if such retries last longer than MAX_CLIENT_TIME
 * seconds, inStr is set to an empty string and the function returns.
 *
 * @param sock   connected socket descriptor to read from
 * @param inStr  output: the received text (empty on timeout)
 */
void get_all_buf(int sock, std::string & inStr) {
    // Same capacity as before (1 MiB including the terminating NUL), but kept
    // on the heap so a single call does not need 1 MiB of stack.
    const size_t capacity = 1024 * 1024;
    std::string temp(capacity, '\0');
    size_t total = 0;

    do {
        // Never hand recv() more room than is left, and always keep the last
        // byte untouched so the buffer stays NUL-terminated for strstr().
        const size_t room = capacity - 1 - total;
        if (room == 0) {
            // Buffer is full and no terminator was seen: stop instead of
            // writing past the end of the buffer.
            break;
        }

        ssize_t n = 0;
        int err = 0;

#ifdef CORE_NONBLOCKING_SOCKETS
        timespec time_to_wait;
        time_to_wait.tv_nsec = 10000000;
        time_to_wait.tv_sec = 0;

        const time_t begin = time(NULL);
        for (;;) {
            n = recv(sock, &temp[total], room, 0);
            // Capture errno immediately: nanosleep(), time() and stream output
            // below are allowed to overwrite it.
            err = errno;

            // Only "would block" is worth waiting for; data, EOF and real
            // errors are handled right away without sleeping.
            if (!(n < 0 && (err == EAGAIN || err == EWOULDBLOCK)))
                break;

            nanosleep(&time_to_wait, NULL);
            if ((time(NULL) - begin) > MAX_CLIENT_TIME) {
                inStr = std::string();
                return;
            }
        }
#else
        n = recv(sock, &temp[total], room, 0);
        err = errno;
#endif

        if (n > 0) {
            total += static_cast<size_t>(n);
        } else if (n == 0) {
            //TODO: error handling
            //debug
            std::cout << "possibly no one byte was received" << std::endl;
            break;
        } else {
            //TODO: error handling
            //debug
            std::cout << "error while receiving data" << std::endl;
            if (err == EBADF) {
                std::cout << "recv returns with EBADF: " << strerror(err) << std::endl;
            } else if (err == EFAULT) {
                std::cout << "recv returns with EFAULT: " << strerror(err) << std::endl;
            } else if (err == EINTR) {
                std::cout << "recv returns with EINTR: " << strerror(err) << std::endl;
            } else if (err == EINVAL) {
                std::cout << "recv returns with EINVAL: " << strerror(err) << std::endl;
            }
            //end debug
            break;
        }

    } while (!strstr(temp.c_str(), "</packet>"));

    // Copy as a C string so the result ends at the first NUL, as before.
    inStr = temp.c_str();
}

上面的函数在 accept_request 函数内被调用。但有时我的调试输出中会出现以下内容:

packet type='connect' 
size of vector<Driver> in getDriversWithMoney is 1 
epoll_wait detected activity of 164 counter i = 0 nfds = 1 
EPOLLRDHUP on 164 
disconnectDriver (fd = 164) 
driver 1 disconnected 
debug EPOLLIN on 164 
error while receiving data 
recv returns with EBADF: Invalid file descriptor 

这意味着某个客户端先连接、随后断开,之后当它尝试再次连接时,recv 返回 EBADF。我做错了什么?请帮帮我。

P.S. 收到 EPOLLRDHUP 时,我只是关闭文件描述符。epoll 的 man 手册说这样没问题,因为 epoll 会自动把已关闭的 fd 从 epoll_wait 的监听集合中移除。

+0

尝试获取出问题时的 `strace` 日志。 – bdonlan 2011-02-04 07:35:57

+0

问题在于这种情况的出现没有规律,要运行一段时间之后才会出现。 – milo 2011-02-04 07:39:00

回答

7

当远程主机关闭套接字时,epoll() 会为该文件描述符同时报告 HUP 和 EPOLLIN。

你首先检查 EPOLLRDHUP,并关闭套接字;然后你检查 EPOLLIN,发现它也被置位,于是尝试调用 recv()。由于套接字已经关闭,文件描述符不再有效,所以你得到 EBADF(关闭套接字会将其从 epoll 集合中移除,因此后续的 epoll_wait() 调用不会再返回它;但对于已经返回的那次 epoll_wait() 来说为时已晚——EPOLLIN 早已在你的 events[i] 中等着了)。

在调用 disconnectDriver() 之后(如果它关闭了文件描述符),你需要停止继续检查该事件:

 if (events[i].events & EPOLLRDHUP) { 
      // Peer hang-up reported for this descriptor: log it and drop the client.
      std::cout << "EPOLLRDHUP on " << events[i].data.fd << std::endl; 
      listener->disconnectDriver(events[i].data.fd); 
      // Move on to the next event: the same mask may also carry EPOLLIN, and
      // the descriptor must not be read after disconnectDriver() (which
      // closes it, according to the question) has run.
      continue; 
     }