Do not set O_NONBLOCK on a threaded program's descriptors any more. Instead,
[dragonfly.git] / lib / libc_r / uthread / uthread_writev.c
1 /*
2  * Copyright (c) 1995-1998 John Birrell <jb@cimlogic.com.au>
3  * All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions
7  * are met:
8  * 1. Redistributions of source code must retain the above copyright
9  *    notice, this list of conditions and the following disclaimer.
10  * 2. Redistributions in binary form must reproduce the above copyright
11  *    notice, this list of conditions and the following disclaimer in the
12  *    documentation and/or other materials provided with the distribution.
13  * 3. All advertising materials mentioning features or use of this software
14  *    must display the following acknowledgement:
15  *      This product includes software developed by John Birrell.
16  * 4. Neither the name of the author nor the names of any co-contributors
17  *    may be used to endorse or promote products derived from this software
18  *    without specific prior written permission.
19  *
20  * THIS SOFTWARE IS PROVIDED BY JOHN BIRRELL AND CONTRIBUTORS ``AS IS'' AND
21  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
24  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30  * SUCH DAMAGE.
31  *
32  * $FreeBSD: src/lib/libc_r/uthread/uthread_writev.c,v 1.16.2.6 2002/11/15 18:39:21 archie Exp $
33  * $DragonFly: src/lib/libc_r/uthread/uthread_writev.c,v 1.3 2006/06/14 01:45:28 dillon Exp $
34  *
35  */
36 #include <sys/types.h>
37 #include <sys/fcntl.h>
38 #include <sys/uio.h>
39 #include <errno.h>
40 #include <stdlib.h>
41 #include <string.h>
42 #include <unistd.h>
43 #include <pthread.h>
44 #include "pthread_private.h"
45
46 ssize_t
47 _writev(int fd, const struct iovec * iov, int iovcnt)
48 {
49         struct pthread  *curthread = _get_curthread();
50         int     blocking;
51         int     idx = 0;
52         int     type;
53         ssize_t cnt;
54         ssize_t n;
55         ssize_t num = 0;
56         ssize_t ret;
57         struct iovec liov[20];
58         struct iovec *p_iov = liov;
59
60         /* Check if the array size exceeds to compiled in size: */
61         if (iovcnt > (sizeof(liov) / sizeof(struct iovec))) {
62                 /* Allocate memory for the local array: */
63                 if ((p_iov = (struct iovec *)
64                     malloc(iovcnt * sizeof(struct iovec))) == NULL) {
65                         /* Insufficient memory: */
66                         errno = ENOMEM;
67                         return (-1);
68                 }
69         }
70
71         /* Copy the caller's array so that it can be modified locally: */
72         memcpy(p_iov,iov,iovcnt * sizeof(struct iovec));
73
74         /* Lock the file descriptor for write: */
75         if ((ret = _FD_LOCK(fd, FD_WRITE, NULL)) == 0) {
76                 /* Get the read/write mode type: */
77                 type = _thread_fd_getflags(fd) & O_ACCMODE;
78
79                 /* Check if the file is not open for write: */
80                 if (type != O_WRONLY && type != O_RDWR) {
81                         /* File is not open for write: */
82                         errno = EBADF;
83                         _FD_UNLOCK(fd, FD_WRITE);
84                         return (-1);
85                 }
86
87                 /* Check if file operations are to block */
88                 blocking = ((_thread_fd_getflags(fd) & O_NONBLOCK) == 0);
89
90                 /*
91                  * Loop while no error occurs and until the expected number
92                  * of bytes are written if performing a blocking write:
93                  */
94                 while (ret == 0) {
95                         /* Perform a non-blocking write syscall: */
96                         n = __sys___pwritev(fd, &p_iov[idx], iovcnt - idx, O_FNONBLOCKING, -1);
97
98                         /* Check if one or more bytes were written: */
99                         if (n > 0) {
100                                 /*
101                                  * Keep a count of the number of bytes
102                                  * written:
103                                  */
104                                 num += n;
105
106                                 /*
107                                  * Enter a loop to check if a short write
108                                  * occurred and move the index to the
109                                  * array entry where the short write
110                                  * ended:
111                                  */
112                                 cnt = n;
113                                 while (cnt > 0 && idx < iovcnt) {
114                                         /*
115                                          * If the residual count exceeds
116                                          * the size of this vector, then
117                                          * it was completely written:
118                                          */
119                                         if (cnt >= p_iov[idx].iov_len)
120                                                 /*
121                                                  * Decrement the residual
122                                                  * count and increment the
123                                                  * index to the next array
124                                                  * entry:
125                                                  */
126                                                 cnt -= p_iov[idx++].iov_len;
127                                         else {
128                                                 /*
129                                                  * This entry was only
130                                                  * partially written, so
131                                                  * adjust it's length
132                                                  * and base pointer ready
133                                                  * for the next write:
134                                                  */
135                                                 p_iov[idx].iov_len -= cnt;
136                                                 p_iov[idx].iov_base += cnt;
137                                                 cnt = 0;
138                                         }
139                                 }
140                         } else if (n == 0) {
141                                 /*
142                                  * Avoid an infinite loop if the last iov_len is
143                                  * 0.
144                                  */
145                                 while (idx < iovcnt && p_iov[idx].iov_len == 0)
146                                         idx++;
147
148                                 if (idx == iovcnt) {
149                                         ret = num;
150                                         break;
151                                 }
152                         }
153                        
154                         /*
155                          * If performing a blocking write, check if the
156                          * write would have blocked or if some bytes
157                          * were written but there are still more to
158                          * write:
159                          */
160                         if (blocking && ((n < 0 && (errno == EWOULDBLOCK ||
161                             errno == EAGAIN)) || (n >= 0 && idx < iovcnt))) {
162                                 curthread->data.fd.fd = fd;
163                                 _thread_kern_set_timeout(NULL);
164
165                                 /* Reset the interrupted operation flag: */
166                                 curthread->interrupted = 0;
167
168                                 _thread_kern_sched_state(PS_FDW_WAIT,
169                                     __FILE__, __LINE__);
170
171                                 /*
172                                  * Check if the operation was
173                                  * interrupted by a signal
174                                  */
175                                 if (curthread->interrupted) {
176                                         if (num > 0) {
177                                                 /* Return partial success: */
178                                                 ret = num;
179                                         } else {
180                                                 /* Return an error: */
181                                                 errno = EINTR;
182                                                 ret = -1;
183                                         }
184                                 }
185
186                         /*
187                          * If performing a non-blocking write,
188                          * just return whatever the write syscall did:
189                          */
190                         } else if (!blocking) {
191                                 /* A non-blocking call might return zero: */
192                                 ret = n;
193                                 break;
194
195                         /*
196                          * If there was an error, return partial success
197                          * (if any bytes were written) or else the error:
198                          */
199                         } else if (n < 0) {
200                                 if (num > 0)
201                                         ret = num;
202                                 else
203                                         ret = n;
204
205                         /* Check if the write has completed: */
206                         } else if (idx == iovcnt)
207                                 /* Return the number of bytes written: */
208                                 ret = num;
209                 }
210                 _FD_UNLOCK(fd, FD_RDWR);
211         }
212
213         /* If memory was allocated for the array, free it: */
214         if (p_iov != liov)
215                 free(p_iov);
216
217         return (ret);
218 }
219
/*
 * writev: public entry point.  Calls _writev() between the thread
 * library's cancellation-point enter and leave calls and passes its
 * result back to the caller unchanged.
 */
ssize_t
writev(int fd, const struct iovec *iov, int iovcnt)
{
        ssize_t nwritten;

        _thread_enter_cancellation_point();
        nwritten = _writev(fd, iov, iovcnt);
        _thread_leave_cancellation_point();

        return (nwritten);
}