Context Navigation

source: mainline/uspace/srv/vfs/vfs_ops.c@ 15b9970

Visit:

lfn serial ticket/834-toolchain-update topic/msim-upgrade topic/simplify-dev-export

Last change on this file since 15b9970 was 15b9970, checked in by Jakub Jermar <jakub@…>, 17 years ago
VFS_OPEN and VFS_WRITE now understand O_APPEND.
Property mode set to `100644`
File size: 15.6 KB

Line
1	/*
2	* Copyright (c) 2008 Jakub Jermar
3	* All rights reserved.
4	*
5	* Redistribution and use in source and binary forms, with or without
6	* modification, are permitted provided that the following conditions
7	* are met:
8	*
9	* - Redistributions of source code must retain the above copyright
10	* notice, this list of conditions and the following disclaimer.
11	* - Redistributions in binary form must reproduce the above copyright
12	* notice, this list of conditions and the following disclaimer in the
13	* documentation and/or other materials provided with the distribution.
14	* - The name of the author may not be used to endorse or promote products
15	* derived from this software without specific prior written permission.
16	*
17	* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
18	* IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
19	* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
20	* IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
21	* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
22	* NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23	* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24	* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25	* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
26	* THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27	*/
28
29	/** @addtogroup fs
30	* @{
31	*/
32
33	/**
34	* @file vfs_ops.c
35	* @brief Operations that VFS offers to its clients.
36	*/
37
38	#include <ipc/ipc.h>
39	#include <async.h>
40	#include <errno.h>
41	#include <stdio.h>
42	#include <stdlib.h>
43	#include <string.h>
44	#include <bool.h>
45	#include <futex.h>
46	#include <rwlock.h>
47	#include <libadt/list.h>
48	#include <unistd.h>
49	#include <ctype.h>
50	#include <fcntl.h>
51	#include <assert.h>
52	#include <atomic.h>
53	#include "vfs.h"
54
55	/**
56	* This rwlock prevents the race between a triplet-to-VFS-node resolution and a
57	* concurrent VFS operation which modifies the file system namespace.
58	*/
59	RWLOCK_INITIALIZE(namespace_rwlock);
60
61	atomic_t rootfs_futex = FUTEX_INITIALIZER;
62	vfs_triplet_t rootfs = {
63	.fs_handle = 0,
64	.dev_handle = 0,
65	.index = 0,
66	};
67
68	static int lookup_root(int fs_handle, int dev_handle, vfs_lookup_res_t *result)
69	{
70	vfs_pair_t altroot = {
71	.fs_handle = fs_handle,
72	.dev_handle = dev_handle,
73	};
74
75	return vfs_lookup_internal("/", strlen("/"), L_DIRECTORY, result,
76	&altroot);
77	}
78
79	void vfs_mount(ipc_callid_t rid, ipc_call_t *request)
80	{
81	int dev_handle;
82	vfs_node_t *mp_node = NULL;
83
84	/*
85	* We expect the library to do the device-name to device-handle
86	* translation for us, thus the device handle will arrive as ARG1
87	* in the request.
88	*/
89	dev_handle = IPC_GET_ARG1(*request);
90
91	/*
92	* For now, don't make use of ARG2 and ARG3, but they can be used to
93	* carry mount options in the future.
94	*/
95
96	ipc_callid_t callid;
97	size_t size;
98
99	/*
100	* Now, we expect the client to send us data with the name of the file
101	* system.
102	*/
103	if (!ipc_data_write_receive(&callid, &size)) {
104	ipc_answer_0(callid, EINVAL);
105	ipc_answer_0(rid, EINVAL);
106	return;
107	}
108
109	/*
110	* Don't receive more than is necessary for storing a full file system
111	* name.
112	*/
113	if (size < 1 \|\| size > FS_NAME_MAXLEN) {
114	ipc_answer_0(callid, EINVAL);
115	ipc_answer_0(rid, EINVAL);
116	return;
117	}
118
119	/* Deliver the file system name. */
120	char fs_name[FS_NAME_MAXLEN + 1];
121	(void) ipc_data_write_finalize(callid, fs_name, size);
122	fs_name[size] = '\0';
123
124	/*
125	* Check if we know a file system with the same name as is in fs_name.
126	* This will also give us its file system handle.
127	*/
128	int fs_handle = fs_name_to_handle(fs_name, true);
129	if (!fs_handle) {
130	ipc_answer_0(rid, ENOENT);
131	return;
132	}
133
134	/* Now, we want the client to send us the mount point. */
135	if (!ipc_data_write_receive(&callid, &size)) {
136	ipc_answer_0(callid, EINVAL);
137	ipc_answer_0(rid, EINVAL);
138	return;
139	}
140
141	/* Check whether size is reasonable wrt. the mount point. */
142	if (size < 1 \|\| size > MAX_PATH_LEN) {
143	ipc_answer_0(callid, EINVAL);
144	ipc_answer_0(rid, EINVAL);
145	return;
146	}
147	/* Allocate buffer for the mount point data being received. */
148	uint8_t *buf;
149	buf = malloc(size);
150	if (!buf) {
151	ipc_answer_0(callid, ENOMEM);
152	ipc_answer_0(rid, ENOMEM);
153	return;
154	}
155
156	/* Deliver the mount point. */
157	(void) ipc_data_write_finalize(callid, buf, size);
158
159	/*
160	* Lookup the root node of the filesystem being mounted.
161	* In this case, we don't need to take the namespace_futex as the root
162	* node cannot be removed. However, we do take a reference to it so
163	* that we can track how many times it has been mounted.
164	*/
165	int rc;
166	vfs_lookup_res_t mr_res;
167	rc = lookup_root(fs_handle, dev_handle, &mr_res);
168	if (rc != EOK) {
169	free(buf);
170	ipc_answer_0(rid, rc);
171	return;
172	}
173	vfs_node_t *mr_node = vfs_node_get(&mr_res);
174	if (!mr_node) {
175	free(buf);
176	ipc_answer_0(rid, ENOMEM);
177	return;
178	}
179
180	/* Finally, we need to resolve the path to the mountpoint. */
181	vfs_lookup_res_t mp_res;
182	futex_down(&rootfs_futex);
183	if (rootfs.fs_handle) {
184	/* We already have the root FS. */
185	rwlock_write_lock(&namespace_rwlock);
186	rc = vfs_lookup_internal(buf, size, L_DIRECTORY, &mp_res,
187	NULL);
188	if (rc != EOK) {
189	/* The lookup failed for some reason. */
190	rwlock_write_unlock(&namespace_rwlock);
191	futex_up(&rootfs_futex);
192	vfs_node_put(mr_node); /* failed -> drop reference */
193	free(buf);
194	ipc_answer_0(rid, rc);
195	return;
196	}
197	mp_node = vfs_node_get(&mp_res);
198	if (!mp_node) {
199	rwlock_write_unlock(&namespace_rwlock);
200	futex_up(&rootfs_futex);
201	vfs_node_put(mr_node); /* failed -> drop reference */
202	free(buf);
203	ipc_answer_0(rid, ENOMEM);
204	return;
205	}
206	/*
207	* Now we hold a reference to mp_node.
208	* It will be dropped upon the corresponding VFS_UNMOUNT.
209	* This prevents the mount point from being deleted.
210	*/
211	rwlock_write_unlock(&namespace_rwlock);
212	} else {
213	/* We still don't have the root file system mounted. */
214	if ((size == 1) && (buf[0] == '/')) {
215	/* For this simple, but important case, we are done. */
216	rootfs = mr_res.triplet;
217	futex_up(&rootfs_futex);
218	free(buf);
219	ipc_answer_0(rid, EOK);
220	return;
221	} else {
222	/*
223	* We can't resolve this without the root filesystem
224	* being mounted first.
225	*/
226	futex_up(&rootfs_futex);
227	free(buf);
228	vfs_node_put(mr_node); /* failed -> drop reference */
229	ipc_answer_0(rid, ENOENT);
230	return;
231	}
232	}
233	futex_up(&rootfs_futex);
234
235	free(buf); /* The buffer is not needed anymore. */
236
237	/*
238	* At this point, we have all necessary pieces: file system and device
239	* handles, and we know the mount point VFS node and also the root node
240	* of the file system being mounted.
241	*/
242
243	int phone = vfs_grab_phone(mp_res.triplet.fs_handle);
244	/* Later we can use ARG3 to pass mode/flags. */
245	aid_t req1 = async_send_3(phone, VFS_MOUNT,
246	(ipcarg_t) mp_res.triplet.dev_handle,
247	(ipcarg_t) mp_res.triplet.index, 0, NULL);
248	/* The second call uses the same method. */
249	aid_t req2 = async_send_3(phone, VFS_MOUNT,
250	(ipcarg_t) mr_res.triplet.fs_handle,
251	(ipcarg_t) mr_res.triplet.dev_handle,
252	(ipcarg_t) mr_res.triplet.index, NULL);
253	vfs_release_phone(phone);
254
255	ipcarg_t rc1;
256	ipcarg_t rc2;
257	async_wait_for(req1, &rc1);
258	async_wait_for(req2, &rc2);
259
260	if ((rc1 != EOK) \|\| (rc2 != EOK)) {
261	/* Mount failed, drop references to mr_node and mp_node. */
262	vfs_node_put(mr_node);
263	if (mp_node)
264	vfs_node_put(mp_node);
265	}
266
267	if (rc2 == EOK)
268	ipc_answer_0(rid, rc1);
269	else if (rc1 == EOK)
270	ipc_answer_0(rid, rc2);
271	else
272	ipc_answer_0(rid, rc1);
273	}
274
275	void vfs_open(ipc_callid_t rid, ipc_call_t *request)
276	{
277	if (!vfs_files_init()) {
278	ipc_answer_0(rid, ENOMEM);
279	return;
280	}
281
282	/*
283	* The POSIX interface is open(path, oflag, mode).
284	* We can receive oflags and mode along with the VFS_OPEN call; the path
285	* will need to arrive in another call.
286	*
287	* We also receive one private, non-POSIX set of flags called lflag
288	* used to pass information to vfs_lookup_internal().
289	*/
290	int lflag = IPC_GET_ARG1(*request);
291	int oflag = IPC_GET_ARG2(*request);
292	int mode = IPC_GET_ARG3(*request);
293	size_t len;
294
295	if (oflag & O_CREAT)
296	lflag \|= L_CREATE;
297	if (oflag & O_EXCL)
298	lflag \|= L_EXCLUSIVE;
299
300	ipc_callid_t callid;
301
302	if (!ipc_data_write_receive(&callid, &len)) {
303	ipc_answer_0(callid, EINVAL);
304	ipc_answer_0(rid, EINVAL);
305	return;
306	}
307
308	/*
309	* Now we are on the verge of accepting the path.
310	*
311	* There is one optimization we could do in the future: copy the path
312	* directly into the PLB using some kind of a callback.
313	*/
314	char *path = malloc(len);
315
316	if (!path) {
317	ipc_answer_0(callid, ENOMEM);
318	ipc_answer_0(rid, ENOMEM);
319	return;
320	}
321
322	int rc;
323	if ((rc = ipc_data_write_finalize(callid, path, len))) {
324	ipc_answer_0(rid, rc);
325	free(path);
326	return;
327	}
328
329	/*
330	* Avoid the race condition in which the file can be deleted before we
331	* find/create-and-lock the VFS node corresponding to the looked-up
332	* triplet.
333	*/
334	if (lflag & L_CREATE)
335	rwlock_write_lock(&namespace_rwlock);
336	else
337	rwlock_read_lock(&namespace_rwlock);
338
339	/* The path is now populated and we can call vfs_lookup_internal(). */
340	vfs_lookup_res_t lr;
341	rc = vfs_lookup_internal(path, len, lflag, &lr, NULL);
342	if (rc) {
343	if (lflag & L_CREATE)
344	rwlock_write_unlock(&namespace_rwlock);
345	else
346	rwlock_read_unlock(&namespace_rwlock);
347	ipc_answer_0(rid, rc);
348	free(path);
349	return;
350	}
351
352	/** Path is no longer needed. */
353	free(path);
354
355	vfs_node_t *node = vfs_node_get(&lr);
356	if (lflag & L_CREATE)
357	rwlock_write_unlock(&namespace_rwlock);
358	else
359	rwlock_read_unlock(&namespace_rwlock);
360
361	/*
362	* Get ourselves a file descriptor and the corresponding vfs_file_t
363	* structure.
364	*/
365	int fd = vfs_fd_alloc();
366	if (fd < 0) {
367	vfs_node_put(node);
368	ipc_answer_0(rid, fd);
369	return;
370	}
371	vfs_file_t *file = vfs_file_get(fd);
372	file->node = node;
373	if (oflag & O_APPEND)
374	file->append = true;
375
376	/*
377	* The following increase in reference count is for the fact that the
378	* file is being opened and that a file structure is pointing to it.
379	* It is necessary so that the file will not disappear when
380	* vfs_node_put() is called. The reference will be dropped by the
381	* respective VFS_CLOSE.
382	*/
383	vfs_node_addref(node);
384	vfs_node_put(node);
385
386	/* Success! Return the new file descriptor to the client. */
387	ipc_answer_1(rid, EOK, fd);
388	}
389
390	static void vfs_rdwr(ipc_callid_t rid, ipc_call_t *request, bool read)
391	{
392
393	/*
394	* The following code strongly depends on the fact that the files data
395	* structure can be only accessed by a single fibril and all file
396	* operations are serialized (i.e. the reads and writes cannot
397	* interleave and a file cannot be closed while it is being read).
398	*
399	* Additional synchronization needs to be added once the table of
400	* open files supports parallel access!
401	*/
402
403	int fd = IPC_GET_ARG1(*request);
404
405	/* Lookup the file structure corresponding to the file descriptor. */
406	vfs_file_t *file = vfs_file_get(fd);
407	if (!file) {
408	ipc_answer_0(rid, ENOENT);
409	return;
410	}
411
412	/*
413	* Now we need to receive a call with client's
414	* IPC_M_DATA_READ/IPC_M_DATA_WRITE request.
415	*/
416	ipc_callid_t callid;
417	int res;
418	if (read)
419	res = ipc_data_read_receive(&callid, NULL);
420	else
421	res = ipc_data_write_receive(&callid, NULL);
422	if (!res) {
423	ipc_answer_0(callid, EINVAL);
424	ipc_answer_0(rid, EINVAL);
425	return;
426	}
427
428	/*
429	* Lock the open file structure so that no other thread can manipulate
430	* the same open file at a time.
431	*/
432	futex_down(&file->lock);
433
434	/*
435	* Lock the file's node so that no other client can read/write to it at
436	* the same time.
437	*/
438	if (read)
439	rwlock_read_lock(&file->node->contents_rwlock);
440	else
441	rwlock_write_lock(&file->node->contents_rwlock);
442
443	int fs_phone = vfs_grab_phone(file->node->fs_handle);
444
445	/* Make a VFS_READ/VFS_WRITE request at the destination FS server. */
446	aid_t msg;
447	ipc_call_t answer;
448	if (!read && file->append)
449	file->pos = file->node->size;
450	msg = async_send_3(fs_phone, IPC_GET_METHOD(*request),
451	file->node->dev_handle, file->node->index, file->pos, &answer);
452
453	/*
454	* Forward the IPC_M_DATA_READ/IPC_M_DATA_WRITE request to the
455	* destination FS server. The call will be routed as if sent by
456	* ourselves. Note that call arguments are immutable in this case so we
457	* don't have to bother.
458	*/
459	ipc_forward_fast(callid, fs_phone, 0, 0, 0, IPC_FF_ROUTE_FROM_ME);
460
461	vfs_release_phone(fs_phone);
462
463	/* Wait for reply from the FS server. */
464	ipcarg_t rc;
465	async_wait_for(msg, &rc);
466	size_t bytes = IPC_GET_ARG1(answer);
467
468	/* Unlock the VFS node. */
469	if (read)
470	rwlock_read_unlock(&file->node->contents_rwlock);
471	else {
472	/* Update the cached version of node's size. */
473	file->node->size = IPC_GET_ARG2(answer);
474	rwlock_write_unlock(&file->node->contents_rwlock);
475	}
476
477	/* Update the position pointer and unlock the open file. */
478	file->pos += bytes;
479	futex_up(&file->lock);
480
481	/*
482	* FS server's reply is the final result of the whole operation we
483	* return to the client.
484	*/
485	ipc_answer_1(rid, rc, bytes);
486	}
487
488	void vfs_read(ipc_callid_t rid, ipc_call_t *request)
489	{
490	vfs_rdwr(rid, request, true);
491	}
492
493	void vfs_write(ipc_callid_t rid, ipc_call_t *request)
494	{
495	vfs_rdwr(rid, request, false);
496	}
497
498	void vfs_seek(ipc_callid_t rid, ipc_call_t *request)
499	{
500	int fd = (int) IPC_GET_ARG1(*request);
501	off_t off = (off_t) IPC_GET_ARG2(*request);
502	int whence = (int) IPC_GET_ARG3(*request);
503
504
505	/* Lookup the file structure corresponding to the file descriptor. */
506	vfs_file_t *file = vfs_file_get(fd);
507	if (!file) {
508	ipc_answer_0(rid, ENOENT);
509	return;
510	}
511
512	off_t newpos;
513	futex_down(&file->lock);
514	if (whence == SEEK_SET) {
515	file->pos = off;
516	futex_up(&file->lock);
517	ipc_answer_1(rid, EOK, off);
518	return;
519	}
520	if (whence == SEEK_CUR) {
521	if (file->pos + off < file->pos) {
522	futex_up(&file->lock);
523	ipc_answer_0(rid, EOVERFLOW);
524	return;
525	}
526	file->pos += off;
527	newpos = file->pos;
528	futex_up(&file->lock);
529	ipc_answer_1(rid, EOK, newpos);
530	return;
531	}
532	if (whence == SEEK_END) {
533	rwlock_read_lock(&file->node->contents_rwlock);
534	size_t size = file->node->size;
535	rwlock_read_unlock(&file->node->contents_rwlock);
536	if (size + off < size) {
537	futex_up(&file->lock);
538	ipc_answer_0(rid, EOVERFLOW);
539	return;
540	}
541	newpos = size + off;
542	futex_up(&file->lock);
543	ipc_answer_1(rid, EOK, newpos);
544	return;
545	}
546	futex_up(&file->lock);
547	ipc_answer_0(rid, EINVAL);
548	}
549
550	void vfs_truncate(ipc_callid_t rid, ipc_call_t *request)
551	{
552	int fd = IPC_GET_ARG1(*request);
553	size_t size = IPC_GET_ARG2(*request);
554	ipcarg_t rc;
555
556	vfs_file_t *file = vfs_file_get(fd);
557	if (!file) {
558	ipc_answer_0(rid, ENOENT);
559	return;
560	}
561	futex_down(&file->lock);
562
563	rwlock_write_lock(&file->node->contents_rwlock);
564	int fs_phone = vfs_grab_phone(file->node->fs_handle);
565	rc = async_req_3_0(fs_phone, VFS_TRUNCATE,
566	(ipcarg_t)file->node->dev_handle, (ipcarg_t)file->node->index,
567	(ipcarg_t)size);
568	vfs_release_phone(fs_phone);
569	if (rc == EOK)
570	file->node->size = size;
571	rwlock_write_unlock(&file->node->contents_rwlock);
572
573	futex_up(&file->lock);
574	ipc_answer_0(rid, rc);
575	}
576
577	void vfs_mkdir(ipc_callid_t rid, ipc_call_t *request)
578	{
579	int mode = IPC_GET_ARG1(*request);
580	size_t len;
581
582	ipc_callid_t callid;
583
584	if (!ipc_data_write_receive(&callid, &len)) {
585	ipc_answer_0(callid, EINVAL);
586	ipc_answer_0(rid, EINVAL);
587	return;
588	}
589
590	/*
591	* Now we are on the verge of accepting the path.
592	*
593	* There is one optimization we could do in the future: copy the path
594	* directly into the PLB using some kind of a callback.
595	*/
596	char *path = malloc(len);
597
598	if (!path) {
599	ipc_answer_0(callid, ENOMEM);
600	ipc_answer_0(rid, ENOMEM);
601	return;
602	}
603
604	int rc;
605	if ((rc = ipc_data_write_finalize(callid, path, len))) {
606	ipc_answer_0(rid, rc);
607	free(path);
608	return;
609	}
610
611	rwlock_write_lock(&namespace_rwlock);
612	int lflag = L_DIRECTORY \| L_CREATE \| L_EXCLUSIVE;
613	rc = vfs_lookup_internal(path, len, lflag, NULL, NULL);
614	rwlock_write_unlock(&namespace_rwlock);
615	free(path);
616	ipc_answer_0(rid, rc);
617	}
618
619	/**
620	* @}
621	*/

Note: See TracBrowser for help on using the repository browser.

Download in other formats: