/*-
 * Copyright (c) 2009-2010 The FreeBSD Foundation
 * Copyright (c) 2011 Pawel Jakub Dawidek <pawel@dawidek.net>
 * All rights reserved.
 *
 * This software was developed by Pawel Jakub Dawidek under sponsorship from
 * the FreeBSD Foundation.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 * $FreeBSD$
 */
32204076Spjd
33204076Spjd#ifndef	_HAST_H_
34204076Spjd#define	_HAST_H_
35204076Spjd
36204076Spjd#include <sys/queue.h>
37204076Spjd#include <sys/socket.h>
38204076Spjd
39204076Spjd#include <arpa/inet.h>
40204076Spjd
41204076Spjd#include <netinet/in.h>
42204076Spjd
43204076Spjd#include <limits.h>
44204076Spjd#include <pthread.h>
45204076Spjd#include <stdbool.h>
46204076Spjd#include <stdint.h>
47204076Spjd
48204076Spjd#include <activemap.h>
49204076Spjd
50204076Spjd#include "proto.h"
51204076Spjd
/*
 * Version history:
 * 0 - initial version
 * 1 - HIO_KEEPALIVE added
 * 2 - "memsync" and "received" attributes added for memsync mode
 */
/* Current protocol version: the latest entry in the history above. */
#define	HAST_PROTO_VERSION	2
59204076Spjd
/* EHAST_* status codes. */
#define	EHAST_OK		0
#define	EHAST_NOENTRY		1
#define	EHAST_INVALID		2
#define	EHAST_NOMEMORY		3
#define	EHAST_UNIMPLEMENTED	4

/* HASTCTL_CMD_* command identifiers. */
#define	HASTCTL_CMD_UNKNOWN	0
#define	HASTCTL_CMD_SETROLE	1
#define	HASTCTL_CMD_STATUS	2

/* Resource roles, as stored in hr_role and hr_previous_role. */
#define	HAST_ROLE_UNDEF		0
#define	HAST_ROLE_INIT		1
#define	HAST_ROLE_PRIMARY	2
#define	HAST_ROLE_SECONDARY	3

/* Synchronization source values (presumably for hr_syncsrc - confirm). */
#define	HAST_SYNCSRC_UNDEF	0
#define	HAST_SYNCSRC_PRIMARY	1
#define	HAST_SYNCSRC_SECONDARY	2

/*
 * HIO_* request types.  HIO_KEEPALIVE was introduced with protocol
 * version 1 (see the version history next to HAST_PROTO_VERSION).
 */
#define	HIO_UNDEF		0
#define	HIO_READ		1
#define	HIO_WRITE		2
#define	HIO_DELETE		3
#define	HIO_FLUSH		4
#define	HIO_KEEPALIVE		5
85204076Spjd
/*
 * Built-in defaults: user name, timeout, configuration file, control
 * socket, listen addresses and PID file.
 * NOTE(review): the unit of HAST_TIMEOUT is not stated here - presumably
 * seconds; confirm against the code that consumes hr_timeout.
 */
#define	HAST_USER		"hast"
#define	HAST_TIMEOUT		20
#define	HAST_CONFIG		"/etc/hast.conf"
#define	HAST_CONTROL		"/var/run/hastctl"
#define	HASTD_LISTEN_TCP4	"tcp4://0.0.0.0:8457"
#define	HASTD_LISTEN_TCP6	"tcp6://[::]:8457"
#define	HASTD_PIDFILE		"/var/run/hastd.pid"

/* Default extent size. */
#define	HAST_EXTENTSIZE	2097152
/* Default maximum number of extents that are kept dirty. */
#define	HAST_KEEPDIRTY	64

/* Size of the address string buffers (hl_addr, hc_controladdr, hr_*addr). */
#define	HAST_ADDRSIZE	1024
/* Number of bytes in hr_token. */
#define	HAST_TOKEN_SIZE	16

/* Number of seconds to sleep between reconnect retries or keepalive packets. */
#define	HAST_KEEPALIVE	10
104219721Strociny
105222108Spjdstruct hastd_listen {
106222108Spjd	/* Address to listen on. */
107222108Spjd	char	 hl_addr[HAST_ADDRSIZE];
108222108Spjd	/* Protocol-specific data. */
109222108Spjd	struct proto_conn *hl_conn;
110222108Spjd	TAILQ_ENTRY(hastd_listen) hl_next;
111222108Spjd};
112222108Spjd
113204076Spjdstruct hastd_config {
114204076Spjd	/* Address to communicate with hastctl(8). */
115229509Strociny	char	hc_controladdr[HAST_ADDRSIZE];
116204076Spjd	/* Protocol-specific data. */
117204076Spjd	struct proto_conn *hc_controlconn;
118217969Spjd	/* Incoming control connection. */
119217969Spjd	struct proto_conn *hc_controlin;
120229509Strociny	/* PID file path. */
121229509Strociny	char	hc_pidfile[PATH_MAX];
122222108Spjd	/* List of addresses to listen on. */
123222108Spjd	TAILQ_HEAD(, hastd_listen) hc_listen;
124204076Spjd	/* List of resources. */
125204076Spjd	TAILQ_HEAD(, hast_resource) hc_resources;
126204076Spjd};
127204076Spjd
/* Replication modes (hr_replication, hr_original_replication). */
#define	HAST_REPLICATION_FULLSYNC	0
#define	HAST_REPLICATION_MEMSYNC	1
#define	HAST_REPLICATION_ASYNC		2

/* Compression algorithms (presumably the values of hr_compression). */
#define	HAST_COMPRESSION_NONE	0
#define	HAST_COMPRESSION_HOLE	1
#define	HAST_COMPRESSION_LZF	2

/* Checksum algorithms (presumably the values of hr_checksum). */
#define	HAST_CHECKSUM_NONE	0
#define	HAST_CHECKSUM_CRC32	1
#define	HAST_CHECKSUM_SHA256	2

/* Forward declaration: this header only ever uses pointers to struct nv. */
struct nv;
141260007Strociny
142204076Spjd/*
143204076Spjd * Structure that describes single resource.
144204076Spjd */
145204076Spjdstruct hast_resource {
146204076Spjd	/* Resource name. */
147204076Spjd	char	hr_name[NAME_MAX];
148249236Strociny	/* Negotiated replication mode (HAST_REPLICATION_*). */
149204076Spjd	int	hr_replication;
150249236Strociny	/* Configured replication mode (HAST_REPLICATION_*). */
151249236Strociny	int	hr_original_replication;
152204076Spjd	/* Provider name that will appear in /dev/hast/. */
153204076Spjd	char	hr_provname[NAME_MAX];
154204076Spjd	/* Synchronization extent size. */
155204076Spjd	int	hr_extentsize;
156204076Spjd	/* Maximum number of extents that are kept dirty. */
157204076Spjd	int	hr_keepdirty;
158211886Spjd	/* Path to a program to execute on various events. */
159211886Spjd	char	hr_exec[PATH_MAX];
160219354Spjd	/* Compression algorithm. */
161219354Spjd	int	hr_compression;
162219351Spjd	/* Checksum algorithm. */
163219351Spjd	int	hr_checksum;
164249236Strociny	/* Protocol version. */
165249236Strociny	int	hr_version;
166204076Spjd
167204076Spjd	/* Path to local component. */
168204076Spjd	char	hr_localpath[PATH_MAX];
169204076Spjd	/* Descriptor to access local component. */
170204076Spjd	int	hr_localfd;
171204076Spjd	/* Offset into local component. */
172204076Spjd	off_t	hr_localoff;
173204076Spjd	/* Size of usable space. */
174204076Spjd	off_t	hr_datasize;
175204076Spjd	/* Size of entire local provider. */
176204076Spjd	off_t	hr_local_mediasize;
177204076Spjd	/* Sector size of local provider. */
178204076Spjd	unsigned int hr_local_sectorsize;
179229509Strociny	/* Is flushing write cache supported by the local provider? */
180229509Strociny	bool	hr_localflush;
181229509Strociny	/* Flush write cache on metadata updates? */
182229509Strociny	int	hr_metaflush;
183204076Spjd
184204076Spjd	/* Descriptor for /dev/ggctl communication. */
185204076Spjd	int	hr_ggatefd;
186204076Spjd	/* Unit number for ggate communication. */
187204076Spjd	int	hr_ggateunit;
188204076Spjd
189204076Spjd	/* Address of the remote component. */
190204076Spjd	char	hr_remoteaddr[HAST_ADDRSIZE];
191219818Spjd	/* Local address to bind to for outgoing connections. */
192219818Spjd	char	hr_sourceaddr[HAST_ADDRSIZE];
193204076Spjd	/* Connection for incoming data. */
194204076Spjd	struct proto_conn *hr_remotein;
195204076Spjd	/* Connection for outgoing data. */
196204076Spjd	struct proto_conn *hr_remoteout;
197204076Spjd	/* Token to verify both in and out connection are coming from
198204076Spjd	   the same node (not necessarily from the same address). */
199204076Spjd	unsigned char hr_token[HAST_TOKEN_SIZE];
200207371Spjd	/* Connection timeout. */
201207371Spjd	int	hr_timeout;
202204076Spjd
203204076Spjd	/* Resource unique identifier. */
204204076Spjd	uint64_t hr_resuid;
205204076Spjd	/* Primary's local modification count. */
206204076Spjd	uint64_t hr_primary_localcnt;
207204076Spjd	/* Primary's remote modification count. */
208204076Spjd	uint64_t hr_primary_remotecnt;
209204076Spjd	/* Secondary's local modification count. */
210204076Spjd	uint64_t hr_secondary_localcnt;
211204076Spjd	/* Secondary's remote modification count. */
212204076Spjd	uint64_t hr_secondary_remotecnt;
213204076Spjd	/* Synchronization source. */
214204076Spjd	uint8_t hr_syncsrc;
215204076Spjd
216204076Spjd	/* Resource role: HAST_ROLE_{INIT,PRIMARY,SECONDARY}. */
217204076Spjd	int	hr_role;
218204076Spjd	/* Previous resource role: HAST_ROLE_{INIT,PRIMARY,SECONDARY}. */
219204076Spjd	int	hr_previous_role;
220204076Spjd	/* PID of child worker process. 0 - no child. */
221204076Spjd	pid_t	hr_workerpid;
222218218Spjd	/* Control commands from parent to child. */
223204076Spjd	struct proto_conn *hr_ctrl;
224212038Spjd	/* Events from child to parent. */
225212038Spjd	struct proto_conn *hr_event;
226218218Spjd	/* Connection requests from child to parent. */
227218218Spjd	struct proto_conn *hr_conn;
228204076Spjd
229204076Spjd	/* Activemap structure. */
230204076Spjd	struct activemap *hr_amp;
231256027Strociny	/* Lock used to synchronize access to hr_amp. */
232204076Spjd	pthread_mutex_t hr_amp_lock;
233256027Strociny	/* Lock used to synchronize access to hr_amp diskmap. */
234256027Strociny	pthread_mutex_t hr_amp_diskmap_lock;
235204076Spjd
236222228Spjd	/* Number of BIO_READ requests. */
237222228Spjd	uint64_t	hr_stat_read;
238222228Spjd	/* Number of BIO_WRITE requests. */
239222228Spjd	uint64_t	hr_stat_write;
240222228Spjd	/* Number of BIO_DELETE requests. */
241222228Spjd	uint64_t	hr_stat_delete;
242222228Spjd	/* Number of BIO_FLUSH requests. */
243222228Spjd	uint64_t	hr_stat_flush;
244222228Spjd	/* Number of activemap updates. */
245222228Spjd	uint64_t	hr_stat_activemap_update;
246247866Strociny	/* Number of local read errors. */
247247866Strociny	uint64_t	hr_stat_read_error;
248247866Strociny	/* Number of local write errors. */
249247866Strociny	uint64_t	hr_stat_write_error;
250247866Strociny	/* Number of local delete errors. */
251247866Strociny	uint64_t	hr_stat_delete_error;
252247866Strociny	/* Number of flush errors. */
253247866Strociny	uint64_t	hr_stat_flush_error;
254247866Strociny	/* Number of activemap write errors. */
255247866Strociny	uint64_t	hr_stat_activemap_write_error;
256247866Strociny	/* Number of activemap flush errors. */
257247866Strociny	uint64_t	hr_stat_activemap_flush_error;
258222228Spjd
259260007Strociny	/* Function to output worker specific info on control status request. */
260260007Strociny	void	(*output_status_aux)(struct nv *);
261260007Strociny
262204076Spjd	/* Next resource. */
263204076Spjd	TAILQ_ENTRY(hast_resource) hr_next;
264204076Spjd};
265204076Spjd
/*
 * Configuration parser entry points.
 *
 * yy_config_parse() returns a struct hastd_config pointer and
 * yy_config_free() takes one.
 * NOTE(review): the implementations are not visible from this header.
 * Presumably `config` is the path of the configuration file,
 * `exitonerror` selects exit-vs-return on a parse failure, and
 * yy_config_free() releases what yy_config_parse() returned - confirm
 * against the parser source.
 */
struct hastd_config *yy_config_parse(const char *config, bool exitonerror);
void yy_config_free(struct hastd_config *config);

/* Parser entry point (presumably generated by yacc - confirm). */
int yyparse(void);
270204076Spjd
271204076Spjd#endif	/* !_HAST_H_ */
272