linux内核之accept实现
- 用户态对accept的标准用法:
- if ((client_fd = accept(sockfd, (struct sockaddr *)&remote_addr, &sin_size)) == -1)
- {
- //accept()函数让服务器接收客户的连接请求
- perror("accept Error\n");
- continue;
- }
- sockfd是通过socket系统调用,并且经过listen过的套接字:
- sockfd = socket(AF_INET, SOCK_STREAM, 0)
- listen(sockfd, 128)
- remote_addr将会存储远端设备的地址信息。
SYSCALL_DEFINE3(accept,int, fd,struct sockaddr __user *, upeer_sockaddr,int __user *, upeer_addrlen){return sys_accept4(fd, upeer_sockaddr, upeer_addrlen,0);}
SYSCALL_DEFINE4(accept4,int, fd,struct sockaddr __user *, upeer_sockaddr,int __user *, upeer_addrlen,int, flags){struct socket *sock,*newsock;struct file *newfile;int err, len, newfd, fput_needed;struct sockaddr_storage address;if(flags &~(SOCK_CLOEXEC | SOCK_NONBLOCK)){return-EINVAL;}if(SOCK_NONBLOCK != O_NONBLOCK &&(flags & SOCK_NONBLOCK)){flags =(flags &~SOCK_NONBLOCK)| O_NONBLOCK;}sock = sockfd_lookup_light(fd,&err,&fput_needed);if(!sock){goto out;}err =-ENFILE;newsock = sock_alloc();/*! 1.创建新的sock给新的连接 */if(!newsock){goto out_put;}newsock->type = sock->type;newsock->ops = sock->ops;/** We don't need try_module_get here, as the listening socket (sock)* has the protocol module (sock->ops->owner) held.*/__module_get(newsock->ops->owner);newfd = get_unused_fd_flags(flags);/*! 2.分配一个fd给新的连接 */if(unlikely(newfd <0)){err = newfd;sock_release(newsock);goto out_put;}newfile = sock_alloc_file(newsock, flags, sock->sk->sk_prot_creator->name);/*! 3.为newsock创建一个对应的file结构 */if(unlikely(IS_ERR(newfile))){err = PTR_ERR(newfile);put_unused_fd(newfd);sock_release(newsock);goto out_put;}err = security_socket_accept(sock, newsock);if(err){goto out_fd;}err = sock->ops->accept(sock, newsock, sock->file->f_flags);/*! 4.调用Socket层操作函数inet_accept() */if(err <0){goto out_fd;}if(upeer_sockaddr){if(newsock->ops->getname(newsock,(struct sockaddr *)&address,&len,2)<0){err =-ECONNABORTED;goto out_fd;}err = move_addr_to_user(&address,len, upeer_sockaddr, upeer_addrlen);if(err <0){goto out_fd;}}/* File flags are not inherited via accept() unlike another OSes. */fd_install(newfd, newfile);err = newfd;out_put:fput_light(sock->file, fput_needed);out:return err;out_fd:fput(newfile);put_unused_fd(newfd);goto out_put;}
struct file *sock_alloc_file(struct socket *sock,int flags,constchar*dname){struct qstr name ={.name =""};struct path path;struct file *file;if(dname){name.name = dname;name.len = strlen(name.name);}elseif(sock->sk){name.name = sock->sk->sk_prot_creator->name;name.len = strlen(name.name);}path.dentry = d_alloc_pseudo(sock_mnt->mnt_sb,&name);if(unlikely(!path.dentry)){return ERR_PTR(-ENOMEM);}path.mnt = mntget(sock_mnt);d_instantiate(path.dentry, SOCK_INODE(sock));file = alloc_file(&path, FMODE_READ | FMODE_WRITE,&socket_file_ops);if(unlikely(IS_ERR(file))){/* drop dentry, keep inode */ihold(path.dentry->d_inode);path_put(&path);return file;}/*! 注意这里的属性设置 */sock->file = file;file->f_flags = O_RDWR |(flags & O_NONBLOCK);file->private_data = sock;return file;}
/** Accept a pending connection. The TCP layer now gives BSD semantics.*/// <net/ipv4/af_inet.c>int inet_accept(struct socket *sock,struct socket *newsock,int flags){struct sock *sk1 = sock->sk;int err =-EINVAL;/*** 如果使用的是TCP,则sk_prot为tcp_prot,accept为inet_csk_accept()* 获取新连接的sock。*/struct sock *sk2 = sk1->sk_prot->accept(sk1, flags,&err);/*! 4.1.获取新连接的sock */if(!sk2){goto do_err;}lock_sock(sk2);sock_rps_record_flow(sk2);WARN_ON(!((1<< sk2->sk_state)&(TCPF_ESTABLISHED | TCPF_SYN_RECV |TCPF_CLOSE_WAIT | TCPF_CLOSE)));sock_graft(sk2, newsock);/*! 4.2.把sock和socket嫁接起来,让它们能相互索引 */newsock->state = SS_CONNECTED;/*! 4.3.把新socket的状态设为已连接 */err =0;release_sock(sk2);do_err:return err;}
// <net/Sock.h>staticinlinevoid sock_graft(struct sock *sk,struct socket *parent){write_lock_bh(&sk->sk_callback_lock);sk->sk_wq = parent->wq;parent->sk = sk; /*! INET层的socket使用下层的sock服务 */sk_set_socket(sk, parent);security_sock_graft(sk, parent);write_unlock_bh(&sk->sk_callback_lock);}
// <net/ipv4/Inet_connection_sock.c>/** This will accept the next outstanding connection.*/struct sock *inet_csk_accept(struct sock *sk,int flags,int*err){struct inet_connection_sock *icsk = inet_csk(sk);struct request_sock_queue *queue=&icsk->icsk_accept_queue;struct sock *newsk;struct request_sock *req;int error;lock_sock(sk);/* We need to make sure that this socket is listening,* and that it has something pending.*/error =-EINVAL;if(sk->sk_state != TCP_LISTEN){goto out_err;}/* Find already established connection */if(reqsk_queue_empty(queue))// 没有ESTABLISHED状态的连接请求块{long timeo = sock_rcvtimeo(sk, flags & O_NONBLOCK);/* If this is a non blocking socket don't sleep */error =-EAGAIN;if(!timeo){goto out_err;}/*! 4.1.1 阻塞等待,直到有全连接。如果用户设置有等待时间,超时后会退出 */error = inet_csk_wait_for_connect(sk, timeo);if(error){goto out_err;}}/*! 从全连接队列中取出第一个established状态的连接请求块 */req = reqsk_queue_remove(queue);newsk = req->sk;sk_acceptq_removed(sk);if(sk->sk_protocol == IPPROTO_TCP &&queue->fastopenq != NULL){spin_lock_bh(&queue->fastopenq->lock);if(tcp_rsk(req)->listener){/* We are still waiting for the final ACK from 3WHS* so can't free req now. Instead, we set req->sk to* NULL to signify that the child socket is taken* so reqsk_fastopen_remove() will free the req* when 3WHS finishes (or is aborted).*/req->sk = NULL;req = NULL;}spin_unlock_bh(&queue->fastopenq->lock);}out:release_sock(sk);if(req){__reqsk_free(req);}return newsk;out_err:newsk = NULL;req = NULL;*err = error;goto out;}
// <net/ipv4/Inet_connection_sock.c>/** Wait for an incoming connection, avoid race conditions. This must be called* with the socket locked.*/staticint inet_csk_wait_for_connect(struct sock *sk,long timeo){struct inet_connection_sock *icsk = inet_csk(sk);DEFINE_WAIT(wait);int err;/** True wake-one mechanism for incoming connections: only* one process gets woken up, not the 'whole herd'.* Since we do not 'race & poll' for established sockets* anymore, the common case will execute the loop only once.** Subtle issue: "add_wait_queue_exclusive()" will be added* after any current non-exclusive waiters, and we know that* it will always _stay_ after any new non-exclusive waiters* because all non-exclusive waiters are added at the* beginning of the wait-queue. As such, it's ok to "drop"* our exclusiveness temporarily when we get woken up without* having to remove and re-insert us on the wait queue.*/for(;;){/*! 把自己加入到等待队列,并且设置自己的状态是可中断的 */prepare_to_wait_exclusive(sk_sleep(sk),&wait,TASK_INTERRUPTIBLE);release_sock(sk);if(reqsk_queue_empty(&icsk->icsk_accept_queue)){/*** 用户发起的accept操作就停schedule_timeout中* switch (timeout)* {* case MAX_SCHEDULE_TIMEOUT:* schedule();* goto out;* default:* }* 根据其实现代码,由于我们一般没有设置timeout值,所以是MAX_SCHEDULE_TIMEOUT的情况,这表示立即进入重新调度,* 而当前的进程可以处于睡眠,直到被其它事件唤醒。*/timeo = schedule_timeout(timeo);}sched_annotate_sleep();lock_sock(sk);err =0;if(!reqsk_queue_empty(&icsk->icsk_accept_queue)){break;}err =-EINVAL;if(sk->sk_state != TCP_LISTEN){break;}err = sock_intr_errno(timeo);if(signal_pending(current)){break;}err =-EAGAIN;if(!timeo){break;}}/*! 下面把任务设置成TASK_RUNNING状态,然后把当前sock从等待队列中删除 */finish_wait(sk_sleep(sk),&wait);return err;}
linux内核之accept实现的更多相关文章
- linux内核的makefile.txt讲解
linux内核的linux-3.6.5\Documentation\kbuild\makefiles.txt Linux Kernel Makefiles This document describe ...
- Linux内核参数配置
Linux在系统运行时修改内核参数(/proc/sys与/etc/sysctl.conf),而不需要重新引导系统,这个功能是通过/proc虚拟文件系统实现的. 在/proc/sys目录下存放着大多数的 ...
- Linux内核 TCP/IP、Socket参数调优
Linux内核 TCP/IP.Socket参数调优 2014-06-06 Harrison.... 阅 9611 转 165 转藏到我的图书馆 微信分享: Doc1: /proc/sy ...
- Linux内核--网络栈实现分析(一)--网络栈初始化
本文分析基于内核Linux Kernel 1.2.13 原创作品,转载请标明http://blog.csdn.net/yming0221/article/details/7488828 更多请看专栏, ...
- Linux内核Makefile文件(翻译自内核手册)
--译自Linux3.9.5 Kernel Makefiles(内核目录documention/kbuild/makefiles.txt) kbuild(kernel build) 内核编译器 Thi ...
- linux内核数据结构学习总结
目录 . 进程相关数据结构 ) struct task_struct ) struct cred ) struct pid_link ) struct pid ) struct signal_stru ...
- linux 内核参数图解
https://www.suse.com/documentation/sles11/book_sle_tuning/data/part_tuning_kernel.html http://blog.c ...
- Linux内核--网络栈实现分析(一)--网络栈初始化--转
转载地址 http://blog.csdn.net/yming0221/article/details/7488828 作者:闫明 本文分析基于内核Linux Kernel 1.2.13 以后的系列博 ...
- TCP/IP协议栈源码图解分析系列10:linux内核协议栈中对于socket相关API的实现
题记:本系列文章的目的是抛开书本从Linux内核源代码的角度详细分析TCP/IP协议栈内核相关技术 轻松搞定TCP/IP协议栈,原创文章欢迎交流, byhankswang@gmail.com linu ...
随机推荐
- opencv 应用程序无法正常启动(0xooooo7b)
#include<iostream> #include <opencv2/core/core.hpp> #include <opencv2/highgui/highgui ...
- Chapter 2(算法)
附件列表 算法.jpg
- winscp以命令行方式同步服务器数据到PC机磁盘上
目前服务器上每日会产生备份文件,需要使用winscp工具把备份同步到本地PC机硬盘上.平时都是图形界面用鼠标点击方式来同步的,效率低下,因此编写了winscp自动同步脚本,并加入到计划任务中定时自动运 ...
- python与pycharm
什么叫自动化测试? 通俗来说,自动化测试就是通过写代码来帮我们测试软件.用来做自动化测试的语言很多,python,Java,php,Go,ruby等.而且软件系统开发语言与自动化测试语言可以不一致.例 ...
- JDBC编程扩展
数据库的分类:关系型数据库.非关系型数据库.这跟数据库的发展相关.关系型数据库:mysql.oracle.sqlserver非关系型数据库:redis.memcathe.mogodb.hadoop1. ...
- RabbitMQ消息队列里积压很多消息
1.场景:上千万条消息在mq里积压了几个小时了还没解决 2.解决: 1)先修复consumer的问题,确保其恢复消费速度,然后将现有cnosumer都停掉 2)新建一个topic,partition是 ...
- angularJS 控制输入的百分数在0%-100%之间
想了老半天了,记录一下 app.directive("percentageCheck", function () { return { restrict: 'A', require ...
- 如何使用Defender优雅的管理权限?
何为权限管理 权限管理已经不知不觉深入到了我们生活的每一个角落,例如地铁进站的闸机,高速公路上的过路费,停车场的杠杆等等等等. 作为一名开发人员,权限二字对我们的映像更加深刻,无论任何系统,都多多少少 ...
- Python练习-迭代器-模拟cat|grep文件
代码如下: # 编辑者:闫龙 def grep(FindWhat): f=open("a.txt","r",encoding="utf8") ...
- 【总结】前端框架:react还是vue?
之前写了一篇前端框架的大汇总,主要介绍了当下主流的框架和其特性.最近除了bootstrap,就属react和vue最为热门,这篇就主要拿这两个框架来做一下详细对比. 究竟如何正确使用?作为小白的我们从 ...