/*
 * Copyright (c) 2025 Miroslav Cimerman
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *
 * - Redistributions of source code must retain the above copyright
 *   notice, this list of conditions and the following disclaimer.
 * - Redistributions in binary form must reproduce the above copyright
 *   notice, this list of conditions and the following disclaimer in the
 *   documentation and/or other materials provided with the distribution.
 * - The name of the author may not be used to endorse or promote products
 *   derived from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

/** @addtogroup hr
 * @{
 */
/**
 * @file
 */

#ifndef _HR_VAR_H
#define _HR_VAR_H

#include <adt/list.h>
#include <bd_srv.h>
#include <errno.h>
#include <fibril_synch.h>
#include <hr.h>
#include <stdatomic.h>
#include <stdbool.h>
#include <stddef.h>
#include <stdint.h>

#include "fge.h"
#include "superblock.h"

/*
 * Short name string of this component.
 * NOTE(review): presumably used as the server/log name - confirm at the
 * call sites, which are not visible in this header.
 */
#define NAME "hr"

/*
 * Strip size constant; expands to DATA_XFER_LIMIT, which is defined
 * outside this header.
 */
#define HR_STRIP_SIZE DATA_XFER_LIMIT

/*
 * Compile-time selection of the RAID 1 read strategy.
 *
 * A strategy is enabled by defining its macro; the alternatives are kept
 * below, commented out. The split strategy is treated as configured only
 * when both HR_RAID1_READ_STRATEGY_SPLIT and
 * HR_RAID1_READ_STRATEGY_SPLIT_THRESHOLD are defined.
 *
 * NOTE(review): the unit of the threshold value is not visible in this
 * header - confirm against the RAID 1 read path.
 */
#define HR_RAID1_READ_STRATEGY_SPLIT
#define HR_RAID1_READ_STRATEGY_SPLIT_THRESHOLD (1024 * 1)

/* #define HR_RAID1_READ_STRATEGY_CLOSEST */
/* #define HR_RAID1_READ_STRATEGY_ROUND_ROBIN */
/* #define HR_RAID1_READ_STRATEGY_FIRST */

/*
 * Refuse to build when no read strategy is usable. The split strategy
 * counts as unusable if either of its two macros is missing, so a lone
 * threshold definition (or a lone SPLIT definition) no longer slips
 * through the check.
 */
#if !defined(HR_RAID1_READ_STRATEGY_ROUND_ROBIN) && \
    !defined(HR_RAID1_READ_STRATEGY_CLOSEST) && \
    !defined(HR_RAID1_READ_STRATEGY_FIRST) && \
    (!defined(HR_RAID1_READ_STRATEGY_SPLIT) || \
    !defined(HR_RAID1_READ_STRATEGY_SPLIT_THRESHOLD))
#error "Some RAID 1 read strategy must be used"
#endif

/*
 * During a rebuild operation, the rebuild position is saved
 * every this many bytes. Currently every 10 MiB.
 */
#define HR_REBUILD_SAVE_BYTES (10U * 1024 * 1024)

/*
 * Forward declarations, so that the types can be referred to through
 * pointers before (or without) their full definitions being visible.
 */
struct hr_volume;
typedef struct hr_volume hr_volume_t;
typedef struct hr_stripe hr_stripe_t;
typedef struct hr_metadata hr_metadata_t;
typedef struct hr_superblock_ops hr_superblock_ops_t;

80 | typedef struct hr_ops {
|
---|
81 | errno_t (*create)(hr_volume_t *);
|
---|
82 | errno_t (*init)(hr_volume_t *);
|
---|
83 | void (*vol_state_eval)(hr_volume_t *);
|
---|
84 | void (*ext_state_cb)(hr_volume_t *, size_t, errno_t);
|
---|
85 | } hr_ops_t;
|
---|
86 |
|
---|
87 | typedef struct hr_volume {
|
---|
88 | link_t lvolumes; /* link to all volumes list */
|
---|
89 | hr_ops_t hr_ops; /* level init and create fcns */
|
---|
90 | bd_srvs_t hr_bds; /* block interface to the vol */
|
---|
91 | service_id_t svc_id; /* service id */
|
---|
92 |
|
---|
93 | list_t range_lock_list; /* list of range locks */
|
---|
94 | fibril_mutex_t range_lock_list_lock; /* range locks list lock */
|
---|
95 |
|
---|
96 | hr_fpool_t *fge; /* fibril pool */
|
---|
97 |
|
---|
98 | void *in_mem_md;
|
---|
99 | fibril_mutex_t md_lock; /* lock protecting in_mem_md */
|
---|
100 |
|
---|
101 | hr_superblock_ops_t *meta_ops;
|
---|
102 |
|
---|
103 | /* invariants */
|
---|
104 | size_t extent_no; /* number of extents */
|
---|
105 | size_t bsize; /* block size */
|
---|
106 | uint64_t truncated_blkno; /* blkno per extent */
|
---|
107 | uint64_t data_blkno; /* no. of user usable blocks */
|
---|
108 | uint64_t data_offset; /* user data offset in blocks */
|
---|
109 | uint32_t strip_size; /* strip size */
|
---|
110 | hr_level_t level; /* volume level */
|
---|
111 | hr_layout_t layout; /* RAID Level Qualifier */
|
---|
112 | char devname[HR_DEVNAME_LEN];
|
---|
113 |
|
---|
114 | hr_extent_t extents[HR_MAX_EXTENTS];
|
---|
115 | fibril_rwlock_t extents_lock; /* extent service id lock */
|
---|
116 |
|
---|
117 | size_t hotspare_no; /* no. of available hotspares */
|
---|
118 | hr_extent_t hotspares[HR_MAX_HOTSPARES];
|
---|
119 | fibril_mutex_t hotspare_lock; /* lock protecting hotspares */
|
---|
120 |
|
---|
121 | fibril_rwlock_t states_lock; /* states lock */
|
---|
122 |
|
---|
123 | _Atomic bool state_dirty; /* dirty state */
|
---|
124 |
|
---|
125 | /*
|
---|
126 | * used to increment metadata counter on first write,
|
---|
127 | * allowing non-destructive read-only access
|
---|
128 | */
|
---|
129 | _Atomic bool first_write;
|
---|
130 |
|
---|
131 | _Atomic uint64_t last_ext_pos_arr[HR_MAX_EXTENTS];
|
---|
132 | _Atomic uint64_t last_ext_used;
|
---|
133 |
|
---|
134 | _Atomic uint64_t rebuild_blk; /* rebuild position */
|
---|
135 | _Atomic int open_cnt; /* open/close() counter */
|
---|
136 | hr_vol_state_t state; /* volume state */
|
---|
137 | uint8_t vflags;
|
---|
138 | } hr_volume_t;
|
---|
139 |
|
---|
/* Kind of block device operation: read or write. */
typedef enum {
	HR_BD_READ,
	HR_BD_WRITE
} hr_bd_op_type_t;

/*
 * Readable names for the boolean argument of hr_metadata_save()
 * (declared outside this header).
 */
#define WITH_STATE_CALLBACK true
#define NO_STATE_CALLBACK false

149 | extern errno_t hr_raid0_create(hr_volume_t *);
|
---|
150 | extern errno_t hr_raid1_create(hr_volume_t *);
|
---|
151 | extern errno_t hr_raid5_create(hr_volume_t *);
|
---|
152 |
|
---|
153 | extern errno_t hr_raid0_init(hr_volume_t *);
|
---|
154 | extern errno_t hr_raid1_init(hr_volume_t *);
|
---|
155 | extern errno_t hr_raid5_init(hr_volume_t *);
|
---|
156 |
|
---|
157 | extern void hr_raid0_vol_state_eval(hr_volume_t *);
|
---|
158 | extern void hr_raid1_vol_state_eval(hr_volume_t *);
|
---|
159 | extern void hr_raid5_vol_state_eval(hr_volume_t *);
|
---|
160 |
|
---|
161 | extern void hr_raid0_ext_state_cb(hr_volume_t *, size_t, errno_t);
|
---|
162 | extern void hr_raid1_ext_state_cb(hr_volume_t *, size_t, errno_t);
|
---|
163 | extern void hr_raid5_ext_state_cb(hr_volume_t *, size_t, errno_t);
|
---|
#endif

/** @}
 */