linux内核之accept实现
- 用户态对accept的标准用法:
- if ((client_fd = accept(sockfd, (struct sockaddr *)&remote_addr, &sin_size)) == -1)
- {
- //accept()函数让服务器接收客户的连接请求
- perror("accept Error\n");
- continue;
- }
- sockfd是通过socket系统调用,并且经过listen过的套接字:
- sockfd = socket(AF_INET, SOCK_STREAM, 0)
- listen(sockfd, 128)
- remote_addr将会存储远端设备的地址信息。
SYSCALL_DEFINE3(accept,int, fd,struct sockaddr __user *, upeer_sockaddr,int __user *, upeer_addrlen){return sys_accept4(fd, upeer_sockaddr, upeer_addrlen,0);}
SYSCALL_DEFINE4(accept4,int, fd,struct sockaddr __user *, upeer_sockaddr,int __user *, upeer_addrlen,int, flags){struct socket *sock,*newsock;struct file *newfile;int err, len, newfd, fput_needed;struct sockaddr_storage address;if(flags &~(SOCK_CLOEXEC | SOCK_NONBLOCK)){return-EINVAL;}if(SOCK_NONBLOCK != O_NONBLOCK &&(flags & SOCK_NONBLOCK)){flags =(flags &~SOCK_NONBLOCK)| O_NONBLOCK;}sock = sockfd_lookup_light(fd,&err,&fput_needed);if(!sock){goto out;}err =-ENFILE;newsock = sock_alloc();/*! 1.创建新的sock给新的连接 */if(!newsock){goto out_put;}newsock->type = sock->type;newsock->ops = sock->ops;/** We don't need try_module_get here, as the listening socket (sock)* has the protocol module (sock->ops->owner) held.*/__module_get(newsock->ops->owner);newfd = get_unused_fd_flags(flags);/*! 2.分配一个fd给新的连接 */if(unlikely(newfd <0)){err = newfd;sock_release(newsock);goto out_put;}newfile = sock_alloc_file(newsock, flags, sock->sk->sk_prot_creator->name);/*! 3.为newsock创建一个对应的file结构 */if(unlikely(IS_ERR(newfile))){err = PTR_ERR(newfile);put_unused_fd(newfd);sock_release(newsock);goto out_put;}err = security_socket_accept(sock, newsock);if(err){goto out_fd;}err = sock->ops->accept(sock, newsock, sock->file->f_flags);/*! 4.调用Socket层操作函数inet_accept() */if(err <0){goto out_fd;}if(upeer_sockaddr){if(newsock->ops->getname(newsock,(struct sockaddr *)&address,&len,2)<0){err =-ECONNABORTED;goto out_fd;}err = move_addr_to_user(&address,len, upeer_sockaddr, upeer_addrlen);if(err <0){goto out_fd;}}/* File flags are not inherited via accept() unlike another OSes. */fd_install(newfd, newfile);err = newfd;out_put:fput_light(sock->file, fput_needed);out:return err;out_fd:fput(newfile);put_unused_fd(newfd);goto out_put;}
struct file *sock_alloc_file(struct socket *sock,int flags,constchar*dname){struct qstr name ={.name =""};struct path path;struct file *file;if(dname){name.name = dname;name.len = strlen(name.name);}elseif(sock->sk){name.name = sock->sk->sk_prot_creator->name;name.len = strlen(name.name);}path.dentry = d_alloc_pseudo(sock_mnt->mnt_sb,&name);if(unlikely(!path.dentry)){return ERR_PTR(-ENOMEM);}path.mnt = mntget(sock_mnt);d_instantiate(path.dentry, SOCK_INODE(sock));file = alloc_file(&path, FMODE_READ | FMODE_WRITE,&socket_file_ops);if(unlikely(IS_ERR(file))){/* drop dentry, keep inode */ihold(path.dentry->d_inode);path_put(&path);return file;}/*! 注意这里的属性设置 */sock->file = file;file->f_flags = O_RDWR |(flags & O_NONBLOCK);file->private_data = sock;return file;}
/** Accept a pending connection. The TCP layer now gives BSD semantics.*/// <net/ipv4/af_inet.c>int inet_accept(struct socket *sock,struct socket *newsock,int flags){struct sock *sk1 = sock->sk;int err =-EINVAL;/*** 如果使用的是TCP,则sk_prot为tcp_prot,accept为inet_csk_accept()* 获取新连接的sock。*/struct sock *sk2 = sk1->sk_prot->accept(sk1, flags,&err);/*! 4.1.获取新连接的sock */if(!sk2){goto do_err;}lock_sock(sk2);sock_rps_record_flow(sk2);WARN_ON(!((1<< sk2->sk_state)&(TCPF_ESTABLISHED | TCPF_SYN_RECV |TCPF_CLOSE_WAIT | TCPF_CLOSE)));sock_graft(sk2, newsock);/*! 4.2.把sock和socket嫁接起来,让它们能相互索引 */newsock->state = SS_CONNECTED;/*! 4.3.把新socket的状态设为已连接 */err =0;release_sock(sk2);do_err:return err;}
// <net/Sock.h>staticinlinevoid sock_graft(struct sock *sk,struct socket *parent){write_lock_bh(&sk->sk_callback_lock);sk->sk_wq = parent->wq;parent->sk = sk; /*! INET层的socket使用下层的sock服务 */sk_set_socket(sk, parent);security_sock_graft(sk, parent);write_unlock_bh(&sk->sk_callback_lock);}
// <net/ipv4/Inet_connection_sock.c>/** This will accept the next outstanding connection.*/struct sock *inet_csk_accept(struct sock *sk,int flags,int*err){struct inet_connection_sock *icsk = inet_csk(sk);struct request_sock_queue *queue=&icsk->icsk_accept_queue;struct sock *newsk;struct request_sock *req;int error;lock_sock(sk);/* We need to make sure that this socket is listening,* and that it has something pending.*/error =-EINVAL;if(sk->sk_state != TCP_LISTEN){goto out_err;}/* Find already established connection */if(reqsk_queue_empty(queue))// 没有ESTABLISHED状态的连接请求块{long timeo = sock_rcvtimeo(sk, flags & O_NONBLOCK);/* If this is a non blocking socket don't sleep */error =-EAGAIN;if(!timeo){goto out_err;}/*! 4.1.1 阻塞等待,直到有全连接。如果用户设置有等待时间,超时后会退出 */error = inet_csk_wait_for_connect(sk, timeo);if(error){goto out_err;}}/*! 从全连接队列中取出第一个established状态的连接请求块 */req = reqsk_queue_remove(queue);newsk = req->sk;sk_acceptq_removed(sk);if(sk->sk_protocol == IPPROTO_TCP &&queue->fastopenq != NULL){spin_lock_bh(&queue->fastopenq->lock);if(tcp_rsk(req)->listener){/* We are still waiting for the final ACK from 3WHS* so can't free req now. Instead, we set req->sk to* NULL to signify that the child socket is taken* so reqsk_fastopen_remove() will free the req* when 3WHS finishes (or is aborted).*/req->sk = NULL;req = NULL;}spin_unlock_bh(&queue->fastopenq->lock);}out:release_sock(sk);if(req){__reqsk_free(req);}return newsk;out_err:newsk = NULL;req = NULL;*err = error;goto out;}
// <net/ipv4/Inet_connection_sock.c>/** Wait for an incoming connection, avoid race conditions. This must be called* with the socket locked.*/staticint inet_csk_wait_for_connect(struct sock *sk,long timeo){struct inet_connection_sock *icsk = inet_csk(sk);DEFINE_WAIT(wait);int err;/** True wake-one mechanism for incoming connections: only* one process gets woken up, not the 'whole herd'.* Since we do not 'race & poll' for established sockets* anymore, the common case will execute the loop only once.** Subtle issue: "add_wait_queue_exclusive()" will be added* after any current non-exclusive waiters, and we know that* it will always _stay_ after any new non-exclusive waiters* because all non-exclusive waiters are added at the* beginning of the wait-queue. As such, it's ok to "drop"* our exclusiveness temporarily when we get woken up without* having to remove and re-insert us on the wait queue.*/for(;;){/*! 把自己加入到等待队列,并且设置自己的状态是可中断的 */prepare_to_wait_exclusive(sk_sleep(sk),&wait,TASK_INTERRUPTIBLE);release_sock(sk);if(reqsk_queue_empty(&icsk->icsk_accept_queue)){/*** 用户发起的accept操作就停schedule_timeout中* switch (timeout)* {* case MAX_SCHEDULE_TIMEOUT:* schedule();* goto out;* default:* }* 根据其实现代码,由于我们一般没有设置timeout值,所以是MAX_SCHEDULE_TIMEOUT的情况,这表示立即进入重新调度,* 而当前的进程可以处于睡眠,直到被其它事件唤醒。*/timeo = schedule_timeout(timeo);}sched_annotate_sleep();lock_sock(sk);err =0;if(!reqsk_queue_empty(&icsk->icsk_accept_queue)){break;}err =-EINVAL;if(sk->sk_state != TCP_LISTEN){break;}err = sock_intr_errno(timeo);if(signal_pending(current)){break;}err =-EAGAIN;if(!timeo){break;}}/*! 下面把任务设置成TASK_RUNNING状态,然后把当前sock从等待队列中删除 */finish_wait(sk_sleep(sk),&wait);return err;}
linux内核之accept实现的更多相关文章
- linux内核的makefile.txt讲解
linux内核的linux-3.6.5\Documentation\kbuild\makefiles.txt Linux Kernel Makefiles This document describe ...
- Linux内核参数配置
Linux在系统运行时修改内核参数(/proc/sys与/etc/sysctl.conf),而不需要重新引导系统,这个功能是通过/proc虚拟文件系统实现的. 在/proc/sys目录下存放着大多数的 ...
- Linux内核 TCP/IP、Socket参数调优
Linux内核 TCP/IP.Socket参数调优 2014-06-06 Harrison.... 阅 9611 转 165 转藏到我的图书馆 微信分享: Doc1: /proc/sy ...
- Linux内核--网络栈实现分析(一)--网络栈初始化
本文分析基于内核Linux Kernel 1.2.13 原创作品,转载请标明http://blog.csdn.net/yming0221/article/details/7488828 更多请看专栏, ...
- Linux内核Makefile文件(翻译自内核手册)
--译自Linux3.9.5 Kernel Makefiles(内核目录documention/kbuild/makefiles.txt) kbuild(kernel build) 内核编译器 Thi ...
- linux内核数据结构学习总结
目录 . 进程相关数据结构 ) struct task_struct ) struct cred ) struct pid_link ) struct pid ) struct signal_stru ...
- linux 内核参数图解
https://www.suse.com/documentation/sles11/book_sle_tuning/data/part_tuning_kernel.html http://blog.c ...
- Linux内核--网络栈实现分析(一)--网络栈初始化--转
转载地址 http://blog.csdn.net/yming0221/article/details/7488828 作者:闫明 本文分析基于内核Linux Kernel 1.2.13 以后的系列博 ...
- TCP/IP协议栈源码图解分析系列10:linux内核协议栈中对于socket相关API的实现
题记:本系列文章的目的是抛开书本从Linux内核源代码的角度详细分析TCP/IP协议栈内核相关技术 轻松搞定TCP/IP协议栈,原创文章欢迎交流, byhankswang@gmail.com linu ...
随机推荐
- 旧题新做:从idy的视角看数据结构
“今天你不写总结……!!!” 额…… 还是讲我的吧.这些考试都是idy出的题. 20170121:DFS序. ST表.线段树练习 这是第一次考数据结构. Problem 1. setsum 1 sec ...
- Apache+tomcat配置动静分离(一个apache一个tomcat,没有做集群)
1. 下载apache http server,tomcat,mok_jk.so apache下载地址:http://httpd.apache.org/download.cgi tomcat下载地址: ...
- Qt 编写多窗口程序
该文章原创于Qter开源社区(www.qter.org),作者yafeilinux,转载请注明出处! 导语 程序要实现的功能是:程序开始出现一个对话框,按下按钮后便能进入主窗口,如果直接关闭 ...
- UIScrollview 与 Autolayout 的那点事
原文 http://www.cocoachina.com/ios/20151221/14757.html 前言 自从写了 介绍Masonry 那篇文章以后 就一直有人对UIScrollView的那个 ...
- .Net Framework4.0 ashx页面报错:检测到有潜在危险的Request.Form值
前些日子做项目的时候遇到一个问题,在ASP.NET 中使用JQuery的AJAX调用一般处理程序ashx出错,在处理程序中错误提示如下:从客户端(Text="<img alt=&quo ...
- 转:Block原理及引用循环问题
2010年WWDC发布iOS4时Apple对Objective-C进行了一次重要的升级:支持Block.说到底这东西就是闭包,其他高级语音例如Java和C++已有支持,第一次使用Block感觉满简单好 ...
- isscroll插件 实现下拉加载 上啦刷新 转
http://www.jb51.net/article/98394.htm 下面是别人的代码 <!DOCTYPE html> <html> <head> <m ...
- vue短信验证性能优化写入localstorage中
平时我们在项目中进行注册等的时候,会经常用到短信验证的功能,但是现在现在很多短信验证都是存在下面几个问题,例如短信验证时间为60s的时候, 1. 当点击完按钮时,倒计时还没到60s过完时,刷新浏览器, ...
- Linux_用户管理&权限管理
2017年1月11日, 星期三 Linux_用户管理&权限管理 1. Linux用户管理&权限管理 终端的概念: tty 查看登录的终端 类型 user group oth ...
- 取消IE下的叉
之前写项目的时候碰到一个小问题,因为IE下的那个叉触发不了我的change事件,所以只好把IE给加上去的那个叉去了,在此记录一下. ::-ms-clear{display:none;} ::-ms-r ...