linux内核之accept实现
- 用户态对accept的标准用法:
- if ((client_fd = accept(sockfd, (struct sockaddr *)&remote_addr, &sin_size)) == -1)
- {
- //accept()函数让服务器接收客户的连接请求
- perror("accept Error\n");
- continue;
- }
- sockfd是通过socket系统调用,并且经过listen过的套接字:
- sockfd = socket(AF_INET, SOCK_STREAM, 0)
- listen(sockfd, 128)
- remote_addr将会存储远端设备的地址信息。
SYSCALL_DEFINE3(accept,int, fd,struct sockaddr __user *, upeer_sockaddr,int __user *, upeer_addrlen){return sys_accept4(fd, upeer_sockaddr, upeer_addrlen,0);}
SYSCALL_DEFINE4(accept4,int, fd,struct sockaddr __user *, upeer_sockaddr,int __user *, upeer_addrlen,int, flags){struct socket *sock,*newsock;struct file *newfile;int err, len, newfd, fput_needed;struct sockaddr_storage address;if(flags &~(SOCK_CLOEXEC | SOCK_NONBLOCK)){return-EINVAL;}if(SOCK_NONBLOCK != O_NONBLOCK &&(flags & SOCK_NONBLOCK)){flags =(flags &~SOCK_NONBLOCK)| O_NONBLOCK;}sock = sockfd_lookup_light(fd,&err,&fput_needed);if(!sock){goto out;}err =-ENFILE;newsock = sock_alloc();/*! 1.创建新的sock给新的连接 */if(!newsock){goto out_put;}newsock->type = sock->type;newsock->ops = sock->ops;/** We don't need try_module_get here, as the listening socket (sock)* has the protocol module (sock->ops->owner) held.*/__module_get(newsock->ops->owner);newfd = get_unused_fd_flags(flags);/*! 2.分配一个fd给新的连接 */if(unlikely(newfd <0)){err = newfd;sock_release(newsock);goto out_put;}newfile = sock_alloc_file(newsock, flags, sock->sk->sk_prot_creator->name);/*! 3.为newsock创建一个对应的file结构 */if(unlikely(IS_ERR(newfile))){err = PTR_ERR(newfile);put_unused_fd(newfd);sock_release(newsock);goto out_put;}err = security_socket_accept(sock, newsock);if(err){goto out_fd;}err = sock->ops->accept(sock, newsock, sock->file->f_flags);/*! 4.调用Socket层操作函数inet_accept() */if(err <0){goto out_fd;}if(upeer_sockaddr){if(newsock->ops->getname(newsock,(struct sockaddr *)&address,&len,2)<0){err =-ECONNABORTED;goto out_fd;}err = move_addr_to_user(&address,len, upeer_sockaddr, upeer_addrlen);if(err <0){goto out_fd;}}/* File flags are not inherited via accept() unlike another OSes. */fd_install(newfd, newfile);err = newfd;out_put:fput_light(sock->file, fput_needed);out:return err;out_fd:fput(newfile);put_unused_fd(newfd);goto out_put;}
struct file *sock_alloc_file(struct socket *sock,int flags,constchar*dname){struct qstr name ={.name =""};struct path path;struct file *file;if(dname){name.name = dname;name.len = strlen(name.name);}elseif(sock->sk){name.name = sock->sk->sk_prot_creator->name;name.len = strlen(name.name);}path.dentry = d_alloc_pseudo(sock_mnt->mnt_sb,&name);if(unlikely(!path.dentry)){return ERR_PTR(-ENOMEM);}path.mnt = mntget(sock_mnt);d_instantiate(path.dentry, SOCK_INODE(sock));file = alloc_file(&path, FMODE_READ | FMODE_WRITE,&socket_file_ops);if(unlikely(IS_ERR(file))){/* drop dentry, keep inode */ihold(path.dentry->d_inode);path_put(&path);return file;}/*! 注意这里的属性设置 */sock->file = file;file->f_flags = O_RDWR |(flags & O_NONBLOCK);file->private_data = sock;return file;}
/** Accept a pending connection. The TCP layer now gives BSD semantics.*/// <net/ipv4/af_inet.c>int inet_accept(struct socket *sock,struct socket *newsock,int flags){struct sock *sk1 = sock->sk;int err =-EINVAL;/*** 如果使用的是TCP,则sk_prot为tcp_prot,accept为inet_csk_accept()* 获取新连接的sock。*/struct sock *sk2 = sk1->sk_prot->accept(sk1, flags,&err);/*! 4.1.获取新连接的sock */if(!sk2){goto do_err;}lock_sock(sk2);sock_rps_record_flow(sk2);WARN_ON(!((1<< sk2->sk_state)&(TCPF_ESTABLISHED | TCPF_SYN_RECV |TCPF_CLOSE_WAIT | TCPF_CLOSE)));sock_graft(sk2, newsock);/*! 4.2.把sock和socket嫁接起来,让它们能相互索引 */newsock->state = SS_CONNECTED;/*! 4.3.把新socket的状态设为已连接 */err =0;release_sock(sk2);do_err:return err;}
// <net/Sock.h>staticinlinevoid sock_graft(struct sock *sk,struct socket *parent){write_lock_bh(&sk->sk_callback_lock);sk->sk_wq = parent->wq;parent->sk = sk; /*! INET层的socket使用下层的sock服务 */sk_set_socket(sk, parent);security_sock_graft(sk, parent);write_unlock_bh(&sk->sk_callback_lock);}
// <net/ipv4/Inet_connection_sock.c>/** This will accept the next outstanding connection.*/struct sock *inet_csk_accept(struct sock *sk,int flags,int*err){struct inet_connection_sock *icsk = inet_csk(sk);struct request_sock_queue *queue=&icsk->icsk_accept_queue;struct sock *newsk;struct request_sock *req;int error;lock_sock(sk);/* We need to make sure that this socket is listening,* and that it has something pending.*/error =-EINVAL;if(sk->sk_state != TCP_LISTEN){goto out_err;}/* Find already established connection */if(reqsk_queue_empty(queue))// 没有ESTABLISHED状态的连接请求块{long timeo = sock_rcvtimeo(sk, flags & O_NONBLOCK);/* If this is a non blocking socket don't sleep */error =-EAGAIN;if(!timeo){goto out_err;}/*! 4.1.1 阻塞等待,直到有全连接。如果用户设置有等待时间,超时后会退出 */error = inet_csk_wait_for_connect(sk, timeo);if(error){goto out_err;}}/*! 从全连接队列中取出第一个established状态的连接请求块 */req = reqsk_queue_remove(queue);newsk = req->sk;sk_acceptq_removed(sk);if(sk->sk_protocol == IPPROTO_TCP &&queue->fastopenq != NULL){spin_lock_bh(&queue->fastopenq->lock);if(tcp_rsk(req)->listener){/* We are still waiting for the final ACK from 3WHS* so can't free req now. Instead, we set req->sk to* NULL to signify that the child socket is taken* so reqsk_fastopen_remove() will free the req* when 3WHS finishes (or is aborted).*/req->sk = NULL;req = NULL;}spin_unlock_bh(&queue->fastopenq->lock);}out:release_sock(sk);if(req){__reqsk_free(req);}return newsk;out_err:newsk = NULL;req = NULL;*err = error;goto out;}
// <net/ipv4/Inet_connection_sock.c>/** Wait for an incoming connection, avoid race conditions. This must be called* with the socket locked.*/staticint inet_csk_wait_for_connect(struct sock *sk,long timeo){struct inet_connection_sock *icsk = inet_csk(sk);DEFINE_WAIT(wait);int err;/** True wake-one mechanism for incoming connections: only* one process gets woken up, not the 'whole herd'.* Since we do not 'race & poll' for established sockets* anymore, the common case will execute the loop only once.** Subtle issue: "add_wait_queue_exclusive()" will be added* after any current non-exclusive waiters, and we know that* it will always _stay_ after any new non-exclusive waiters* because all non-exclusive waiters are added at the* beginning of the wait-queue. As such, it's ok to "drop"* our exclusiveness temporarily when we get woken up without* having to remove and re-insert us on the wait queue.*/for(;;){/*! 把自己加入到等待队列,并且设置自己的状态是可中断的 */prepare_to_wait_exclusive(sk_sleep(sk),&wait,TASK_INTERRUPTIBLE);release_sock(sk);if(reqsk_queue_empty(&icsk->icsk_accept_queue)){/*** 用户发起的accept操作就停schedule_timeout中* switch (timeout)* {* case MAX_SCHEDULE_TIMEOUT:* schedule();* goto out;* default:* }* 根据其实现代码,由于我们一般没有设置timeout值,所以是MAX_SCHEDULE_TIMEOUT的情况,这表示立即进入重新调度,* 而当前的进程可以处于睡眠,直到被其它事件唤醒。*/timeo = schedule_timeout(timeo);}sched_annotate_sleep();lock_sock(sk);err =0;if(!reqsk_queue_empty(&icsk->icsk_accept_queue)){break;}err =-EINVAL;if(sk->sk_state != TCP_LISTEN){break;}err = sock_intr_errno(timeo);if(signal_pending(current)){break;}err =-EAGAIN;if(!timeo){break;}}/*! 下面把任务设置成TASK_RUNNING状态,然后把当前sock从等待队列中删除 */finish_wait(sk_sleep(sk),&wait);return err;}
linux内核之accept实现的更多相关文章
- linux内核的makefile.txt讲解
linux内核的linux-3.6.5\Documentation\kbuild\makefiles.txt Linux Kernel Makefiles This document describe ...
- Linux内核参数配置
Linux在系统运行时修改内核参数(/proc/sys与/etc/sysctl.conf),而不需要重新引导系统,这个功能是通过/proc虚拟文件系统实现的. 在/proc/sys目录下存放着大多数的 ...
- Linux内核 TCP/IP、Socket参数调优
Linux内核 TCP/IP.Socket参数调优 2014-06-06 Harrison.... 阅 9611 转 165 转藏到我的图书馆 微信分享: Doc1: /proc/sy ...
- Linux内核--网络栈实现分析(一)--网络栈初始化
本文分析基于内核Linux Kernel 1.2.13 原创作品,转载请标明http://blog.csdn.net/yming0221/article/details/7488828 更多请看专栏, ...
- Linux内核Makefile文件(翻译自内核手册)
--译自Linux3.9.5 Kernel Makefiles(内核目录documention/kbuild/makefiles.txt) kbuild(kernel build) 内核编译器 Thi ...
- linux内核数据结构学习总结
目录 . 进程相关数据结构 ) struct task_struct ) struct cred ) struct pid_link ) struct pid ) struct signal_stru ...
- linux 内核参数图解
https://www.suse.com/documentation/sles11/book_sle_tuning/data/part_tuning_kernel.html http://blog.c ...
- Linux内核--网络栈实现分析(一)--网络栈初始化--转
转载地址 http://blog.csdn.net/yming0221/article/details/7488828 作者:闫明 本文分析基于内核Linux Kernel 1.2.13 以后的系列博 ...
- TCP/IP协议栈源码图解分析系列10:linux内核协议栈中对于socket相关API的实现
题记:本系列文章的目的是抛开书本从Linux内核源代码的角度详细分析TCP/IP协议栈内核相关技术 轻松搞定TCP/IP协议栈,原创文章欢迎交流, byhankswang@gmail.com linu ...
随机推荐
- MongoDB 安装及开启关闭
开启关闭的方式: 命令行 输入 net start mongodb 就打开mongo的服务了 输入 net stop mongodb 关闭服务 验证是否成功的方式: 在浏览器中输入 http://lo ...
- github怎么绑定自己的域名
本文前提是你已经搭建好了博客. CAST: 1 没有域名的话先去申请一个域名 如果想简单省心,不计较时间和金钱的话,那就阿里云或腾讯云买全套大宝剑(服务器+域名+解析). 因为本人不想备案(时间长), ...
- 字典的setdefault() 和get()方法比较
Python 字典 setdefault() 函数 和get() 类似: 如果键存在字典中,返回其value值 如果键不存在字典中,创建键值对.完后,返回值为默认值. 话不多说,上栗子: setdef ...
- mysql 设置默认编码为 utf8
vi /etc/mysql/mysql.conf.d/mysqld.cnf [client] default-character-set=utf8 [mysql] default-character- ...
- Sitemesh 3使用及配置
1:Sitemesh简介 SiteMesh是一个网页布局和修饰的框架,利用它可以将网页的内容和页面结构分离,以达到页面结构共享的目的. SiteMesh是基于Servlet的filter的,即过滤流. ...
- mq使用场景、不丢不重、时序性
mq使用场景.不丢不重.时序性.削峰 参考: http://zhuanlan.51cto.com/art/201704/536407.htm http://zhuanlan.51cto.com/art ...
- Java并发编程原理与实战三十六:阻塞队列&消息队列
一.阻塞队列 1.阻塞队列BlockingQueue ---->可以理解成生产者消费者的模式---->消费者要等待到生产者生产出来产品.---->而非阻塞队列ConcurrentLi ...
- 经典全屏滚动插件fullPage.js
要写简单可以写的很简单,对着github上面的参数和注释随便写了个demo.这个插件十分高端大气上档次,配上良好的配色和布局,简单几笔就可以把网站装扮得十分洋气. 唯一的缺点就是,感觉对移动端的兼容性 ...
- 出了一个js的题。
class test { set xx(v){ console.log('i am set'); this.__ok = v; } get xx(){ console.log('i am get'); ...
- CodeForces - 1042B
Berland shop sells nn kinds of juices. Each juice has its price cici. Each juice includes some set o ...