首页 \ 问答 \ 大文件上的aio_write(aio_write on Large Files)

大文件上的aio_write(aio_write on Large Files)

 我试图用aio_read(3)和aio_write(3)以异步的方式模仿sendfile(2)的功能。  
 除了测试大型（> 150k）文件外，一切似乎都正常工作。  
 我有一个简单的struct io_request用于跟踪传输：  
struct io_request {
    int status;
    struct aiocb *aiocbp;
    int sfd;
};
 
 首先，我建立了aio_read()调用：  
struct io_request * ioreq = malloc(sizeof(struct io_request));
ioreq->status = EINPROGRESS;
ioreq->sfd = sfd;

struct aiocb * aiocbreq = malloc(sizeof(struct aiocb));
memset(aiocbreq, 0, sizeof(struct aiocb));

ioreq->aiocbp = aiocbreq;

ioreq->aiocbp->aio_fildes = ffd;

if (ioreq->aiocbp->aio_fildes == -1) {
    perror("aio_fildes");
}

ioreq->aiocbp->aio_buf = malloc(st.st_size);
if (ioreq->aiocbp->aio_buf == NULL) {
    perror("aio_buf malloc");
}

ioreq->aiocbp->aio_nbytes = st.st_size;
ioreq->aiocbp->aio_reqprio = 0;
ioreq->aiocbp->aio_offset = 0;
ioreq->aiocbp->aio_sigevent.sigev_signo = IO_READ_SIGNAL;
ioreq->aiocbp->aio_sigevent.sigev_value.sival_ptr = ioreq;
if (aio_read(ioreq->aiocbp) == -1) {
    perror("aio_read");
}
 
 然后在IO_READ_SIGNAL处理程序中捕获IO_READ_SIGNAL ：  
static void
aio_read_handler(int sig, siginfo_t *si, void *ucontext)
{
    if (si->si_code == SI_ASYNCIO) {
        struct io_request *ioreq = si->si_value.sival_ptr;

        // Build the AIO write request
        struct aiocb aiocbreq;
        memset(&aiocbreq, 0, sizeof(struct aiocb));
        aiocbreq.aio_fildes = ioreq->sfd;
        aiocbreq.aio_buf = ioreq->aiocbp->aio_buf;
        aiocbreq.aio_nbytes = ioreq->aiocbp->aio_nbytes;
        aiocbreq.aio_sigevent.sigev_signo = IO_WRITE_SIGNAL;
        aiocbreq.aio_sigevent.sigev_value.sival_ptr = ioreq;

        if (aio_write((void *) &aiocbreq) == -1) {
            perror("aio_write");
        }
    }
}
 
 我可以确认在处理程序内部，即使是大文件， ioreq->aiocbp->aio_buf的内容也是完整且完整的。  
 稍后，将在IO_WRITE_SIGNAL处理程序中捕获aio_write() ：  
static void
aio_write_handler(int sig, siginfo_t *si, void *ucontext)
{
    if (si->si_code == SI_ASYNCIO) {
        struct io_request *ioreq = si->si_value.sival_ptr;

        ssize_t bytes_written = aio_return(ioreq->aiocbp);
        printf("Wrote %zu of %zu bytes\n", bytes_written, ioreq->aiocbp->aio_nbytes);
        //free(ioreq->aiocbp);
        //free(ioreq);

        if (aio_error(ioreq->aiocbp) != 0) {
            perror("aio_write_handler");
        }
    }
}
 
 此时aio_write()应该已经完成。 我检查返回值并据此采取行动。 这两个调用都会报告已写入的相应字节数，并且在写入期间不会出现错误。  
 更大的应用程序是一个HTTP服务器。 我推测这个问题是由于远程客户端无法快速读取以跟上aio_write() 。 当我有一个sendfile()实现时，我不得不多次调用sendfile()来完成文件传输。  
 几个直接的问题：  
 
  为什么aio_return()和aio_error()不报告任何问题？  
  我该如何解决这个问题？  
  有没有办法缓冲aio_write() ？ 我正在考虑n_bytes传递给aio_write() struct aiocb的n_bytes ，并在aio_write()多次调用aio_write_handler() 。  
 
 谢谢你的帮助！ 

I'm trying to essentially mimic the functionality of sendfile(2) in an asynchronous fashion using aio_read(3) and aio_write(3). 
Everything seems to be working fine, with the exception of testing large (> 150k) files. 
I have a simple struct io_request I am using to keep track of the transfers: 
struct io_request {
    int status;
    struct aiocb *aiocbp;
    int sfd;
};
 
First, I build the aio_read() call: 
struct io_request * ioreq = malloc(sizeof(struct io_request));
ioreq->status = EINPROGRESS;
ioreq->sfd = sfd;

struct aiocb * aiocbreq = malloc(sizeof(struct aiocb));
memset(aiocbreq, 0, sizeof(struct aiocb));

ioreq->aiocbp = aiocbreq;

ioreq->aiocbp->aio_fildes = ffd;

if (ioreq->aiocbp->aio_fildes == -1) {
    perror("aio_fildes");
}

ioreq->aiocbp->aio_buf = malloc(st.st_size);
if (ioreq->aiocbp->aio_buf == NULL) {
    perror("aio_buf malloc");
}

ioreq->aiocbp->aio_nbytes = st.st_size;
ioreq->aiocbp->aio_reqprio = 0;
ioreq->aiocbp->aio_offset = 0;
ioreq->aiocbp->aio_sigevent.sigev_signo = IO_READ_SIGNAL;
ioreq->aiocbp->aio_sigevent.sigev_value.sival_ptr = ioreq;
if (aio_read(ioreq->aiocbp) == -1) {
    perror("aio_read");
}
 
Which then later is captured in a IO_READ_SIGNAL handler: 
static void
aio_read_handler(int sig, siginfo_t *si, void *ucontext)
{
    if (si->si_code == SI_ASYNCIO) {
        struct io_request *ioreq = si->si_value.sival_ptr;

        // Build the AIO write request
        struct aiocb aiocbreq;
        memset(&aiocbreq, 0, sizeof(struct aiocb));
        aiocbreq.aio_fildes = ioreq->sfd;
        aiocbreq.aio_buf = ioreq->aiocbp->aio_buf;
        aiocbreq.aio_nbytes = ioreq->aiocbp->aio_nbytes;
        aiocbreq.aio_sigevent.sigev_signo = IO_WRITE_SIGNAL;
        aiocbreq.aio_sigevent.sigev_value.sival_ptr = ioreq;

        if (aio_write((void *) &aiocbreq) == -1) {
            perror("aio_write");
        }
    }
}
 
I can confirm that inside the handler, even for large files, the contents of ioreq->aiocbp->aio_buf is full and complete. 
Later, the aio_write() is captured in a IO_WRITE_SIGNAL handler: 
static void
aio_write_handler(int sig, siginfo_t *si, void *ucontext)
{
    if (si->si_code == SI_ASYNCIO) {
        struct io_request *ioreq = si->si_value.sival_ptr;

        ssize_t bytes_written = aio_return(ioreq->aiocbp);
        printf("Wrote %zu of %zu bytes\n", bytes_written, ioreq->aiocbp->aio_nbytes);
        //free(ioreq->aiocbp);
        //free(ioreq);

        if (aio_error(ioreq->aiocbp) != 0) {
            perror("aio_write_handler");
        }
    }
}
 
At this point aio_write() should have been completed. I check the return values and act accordingly. Both calls report the appropriate number of bytes have been written and no errors arose during the write. 
The greater application is an HTTP server. I speculate that this problem arrises because the remote client cannot read fast enough to keep up with the aio_write(). When I had a sendfile() implementation of this, I had to call sendfile() multiple times to complete the file transfer. 
Several direct questions: 
 
 Why does aio_return() and aio_error() not report any problems? 
 How can I fix this behavior? 
 Are there ways to buffer aio_write()? I was thinking of capping of n_bytes inside struct aiocb passed to aio_write(), and just calling aio_write() multiple times from inside aio_write_handler(). 
 
Thanks for your help!

原文：https://stackoverflow.com/questions/41046769

更新时间：2023-09-24 06:09

最满意答案

 我们可以按值传递参数的原因完全相同 - 如果您需要副本，请按值获取。  
 
  我无法想象通过显式创建副本而不是为您执行循环而无法解决的任何问题。  
 
 我认为这是你遇到的主要问题。 循环不是“为你做”。 这是明确要求副本。 什么比初始化非参考变量更明确？  
 这实际上只是一个普通的声明。 为什么，当它在其他地方都有效时，我们会让auto本身无效吗？ 实际上，该声明的初始化由标准定义为：  
auto x = *__begin;
 
 其中__begin是赋予范围的第一个元素的迭代器的表达式（在本例中为v.begin() ）。 这与C ++中的任何其他复制没有什么不同。 你会认为以下是一个常见的错误吗？  
int x = some_other_int;
 
 要么：  
std::string str = some_other_string;
 
 不，当我们想要一份副本时，我们会写一个这样的声明。  
 这是一个用例示例：  
void modify_argument(X&);
void use(X);

// ...

std::vector<X> v = /* ... */;
for (auto x : v) {
  // We want to modify the copy of x, but not the original:
  modify_argument(x);
  use(x);
}

Exactly the same reason we can pass arguments by value - if you need a copy, take it by value.  
 
 I can't imagine anything that can not be solved by just creating a copy explicitly instead of the loop doing it for you. 
 
I think this is the main issue you're having. The loop isn't "doing it for you". This is asking for a copy explicitly. What's more explicit than initialising a non-reference variable? 
This is really just a normal declaration. Why, when it is valid everywhere else, would we make auto by itself be invalid here? In fact, the initialization of this declaration is defined by the standard as: 
auto x = *__begin;
 
where __begin is the expression giving an iterator to the first element of the range (in this case v.begin()). This is no different to any other copying in C++. Would you consider the following to be a common mistake? 
int x = some_other_int;
 
Or: 
std::string str = some_other_string;
 
No, we write a declaration like this when we want a copy. 
Here's an example use case: 
void modify_argument(X&);
void use(X);

// ...

std::vector<X> v = /* ... */;
for (auto x : v) {
  // We want to modify the copy of x, but not the original:
  modify_argument(x);
  use(x);
}

大文件上的aio_write(aio_write on Large Files)

最满意答案

相关问答

在Qt中正确使用C ++ 11基于范围的for循环(Using C++11 range-based for loop correctly in Qt)[2022-09-11]

C ++ 11反向范围的for-loop(C++11 reverse range-based for-loop)[2022-05-30]

C ++ 11基于范围的for循环，没有循环变量(C++11 range-based for loops without loop variable)[2022-06-14]

允许基于范围的枚举类？(Allow for Range-Based For with enum classes?)[2023-01-26]

使用C ++ 11的基于范围的正确方法是什么？(What is the correct way of using C++11's range-based for?)[2023-07-29]

为什么在C ++ 11的基于范围的情况下需要按值获取(Why is capturing by value needed in C++11's range-based for)[2022-03-07]

C ++ 11基于范围的for循环派生对象(C++11 range-based for loop on derived objects)[2022-08-12]

基于范围的for循环中的C ++ 11重新声明(C++11 redeclaration in range-based for loop)[2022-04-09]

如何使用基于C ++ 11范围的QJsonArray(How to use C++11 range-based for with QJsonArray)[2024-01-13]

如何在char * argv []上执行基于范围的c ++ 11 for循环？(How to perform a range-based c++11 for loop on char* argv[]?)[2024-01-12]

相关文章

最新问答