1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453
|
/* declarations of routines that interface with the kernel's IPsec mechanism
* Copyright (C) 1998-2001,2013 D. Hugh Redelmeier <hugh@mimosa.com>
* Copyright (C) 2011 Michael Richardson <mcr@sandelman.ca>
* Copyright (C) 2012 Avesh Agarwal <avagarwa@redhat.com>
* Copyright (C) 2013 Kim Heino <b@bbbs.net>
* Copyright (C) 2013 Tuomo Soini <tis@foobar.fi>
* Copyright (C) 2012-2013 Paul Wouters <paul@libreswan.org>
* Copyright (C) 2019 Andrew Cagney <cagney@gnu.org>
* Copyright (C) 2019 Paul Wouters <pwouters@redhat.com>
* Copyright (C) 2017 Mayank Totale <mtotale@gmail.com>
*
* This program is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License as published by the
* Free Software Foundation; either version 2 of the License, or (at your
* option) any later version. See <https://www.gnu.org/licenses/gpl2.txt>.
*
* This program is distributed in the hope that it will be useful, but
* WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
* or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
* for more details.
*
*/
#ifndef KERNEL_H
#define KERNEL_H
#include <net/if.h>
#include "monotime.h"
#include "reqid.h"
#include "connections.h" /* for struct sa_marks et.al. */
#include "ip_said.h" /* for SA_AH et.al. */
#include "ip_packet.h"
#include "kernel_mode.h"
/*
* Forward declarations of structure types. Where this header refers to
* them it does so only through pointers, so the full definitions are
* not needed here.
*/
struct sa_marks;
struct spd;
struct iface_device;
struct kernel_iface;
struct show;
struct kernel_policy;
/*
 * Identifier carried by a kernel state (struct kernel_state notes that
 * linux calls this "seq").  Only the default value is given a name.
 */
enum kernel_state_id {
	DEFAULT_KERNEL_STATE_ID = 0,
}; /* sizeof() >= sizeof(uint32_t) */
/*
 * Identifier carried by a kernel policy (struct kernel_acquire suggests
 * it corresponds to the kernel policy's index).  Only the default value
 * is given a name.
 */
enum kernel_policy_id {
	DEFAULT_KERNEL_POLICY_ID = 0,
}; /* sizeof() >= sizeof(uint32_t) */
/*
* Declare policy things early enough for uses.
* Although some of these things look like they are KLIPS-only, their
* definitions are in fact needed by all kernel interfaces at this time.
*
* Flags are encoded above the low-order byte of verbs.
* "real" eroutes are only outbound. Inbound eroutes don't exist,
* but an addflow with an INBOUND flag allows IPIP tunnels to be
* limited to appropriate source and destination addresses.
*/
/*
 * The operation passed to kernel_ops.policy_add(): either add a kernel
 * policy or replace one.
 */
enum kernel_policy_op {
	/* three bits */
	KERNEL_POLICY_OP_ADD     = 1,
	KERNEL_POLICY_OP_REPLACE = 2,
};

/* name table for enum kernel_policy_op; defined elsewhere */
extern const struct enum_names kernel_policy_op_names;
/*
 * A single traffic direction.
 *
 * Each value is a distinct bit so that the two can be OR'ed together
 * (see enum directions).
 */
enum direction {
	DIRECTION_INBOUND  = 1 << 1,	/* 2; >true */
	DIRECTION_OUTBOUND = 1 << 2,	/* 4; so lset_t works */
};

/* name table for enum direction; defined elsewhere */
extern const struct enum_names direction_names;
/*
* A set of enum direction values: inbound alone, outbound alone, or
* both OR'ed together.
*/
enum directions {
DIRECTIONS_INBOUND = DIRECTION_INBOUND,
DIRECTIONS_OUTBOUND = DIRECTION_OUTBOUND,
DIRECTIONS_INBOUND_AND_OUTBOUND = DIRECTION_INBOUND|DIRECTION_OUTBOUND,
};
/*
 * What to do when the kernel policy operation returns ENOENT?
 */
enum expect_kernel_policy {
	/* Kernel policy can return either ENOENT or 0. */
	KERNEL_POLICY_PRESENT_OR_MISSING,
	KERNEL_POLICY_PRESENT,
	KERNEL_POLICY_MISSING,
};

/*
 * Yield KERNEL_POLICY_PRESENT when the bit(s) in DIRECTION are set in
 * DIRECTIONS, else KERNEL_POLICY_MISSING.
 *
 * Both arguments are parenthesized so that compound expressions (for
 * instance A|B) can be passed without '&' binding to only part of
 * the argument.
 */
#define expect_kernel_policy(DIRECTIONS, DIRECTION)			\
	((DIRECTIONS) & (DIRECTION) ? KERNEL_POLICY_PRESENT : KERNEL_POLICY_MISSING)

/*
 * Yield a constant string naming the enum expect_kernel_policy value
 * E, or "?" when E is not one of the enumerators.
 *
 * E is evaluated exactly once.  The switch deliberately has no
 * default: so the compiler can flag an enumerator that is added
 * above but not handled here.
 */
#define expect_kernel_policy_name(E)					\
	({								\
		enum expect_kernel_policy e_ = (E);			\
		const char *n_ = "?";					\
		switch (e_) {						\
		case KERNEL_POLICY_PRESENT_OR_MISSING: n_ = "PRESENT or MISSING"; break; \
		case KERNEL_POLICY_MISSING: n_ = "MISSING"; break;	\
		case KERNEL_POLICY_PRESENT: n_ = "PRESENT"; break;	\
		}							\
		n_;							\
	})
/*
 * The kind of NIC offload recorded in struct nic_offload: none,
 * crypto, or packet.
 */
enum kernel_offload_type {
	KERNEL_OFFLOAD_NONE   = 0,
	KERNEL_OFFLOAD_CRYPTO = 1,
	KERNEL_OFFLOAD_PACKET = 2,
};
/*
* NIC offload settings; embedded in struct kernel_state and passed to
* kernel_ops.poke_ipsec_offload_policy_hole().
*/
struct nic_offload {
const char *dev; /* presumably the network device's name -- TODO confirm */
enum kernel_offload_type type; /* none, crypto, or packet */
};
/*
* The CHILD (IPsec, kernel) SA has two IP ends.
*
* struct kernel_state holds one of these for each of its .src and .dst.
*/
struct kernel_state_end {
/*
* For ESP/AH which is carried by raw IP packets, only an
* address is needed to identify an end. However when
* encapsulated (in UDP or TCP) the port is also needed.
*
* Why not an endpoint so that it encapsulates the port and,
* for that matter the protocol?
*/
ip_address address;
int encap_port; /* the port for the encapsulated (UDP or TCP) case above */
/*
* This is not the subnet you're looking for: the transport
* selector or packet filter.
*
* XXX: old comment?
*
* The route addresses of the encapsulated packets.
*
* With pfkey and transport mode with nat-traversal we need to
* change the remote IPsec SA to point to external ip of the
* peer. Here we substitute real client ip with NATD ip.
*
* Bug #1004 fix.
*
* There really isn't "client" with XFRM and transport mode so
* eroute must be done to natted, visible ip. If we don't hide
* internal IP, communication doesn't work.
*/
ip_selector route;
};
/*
* Description of one kernel (IPsec) SA; this is what is handed to
* kernel_ops.add_sa() and kernel_ops.get_kernel_state().
*/
struct kernel_state {
const char *story; /* presumably a description for logging (cf. the "often SAID string" story parameters below) -- TODO confirm */
struct kernel_state_end src;
struct kernel_state_end dst;
/*
* Is the stack using tunnel mode; and if it is does this SA
* need the tunnel-mode bit?
*
* In tunnel mode, only the inner-most SA (level==0) should
* have the tunnel-mode bit set. And in transport mode, all
* SAs get selectors.
*/
enum kernel_mode mode;
unsigned level; /* inner-most is 0 */
enum direction direction;
ipsec_spi_t spi;
const struct ip_protocol *proto; /* ESP, AH, IPCOMP */
const struct ip_encap *encap_type; /* ESP-in-TCP, ESP-in-UDP; or NULL */
enum kernel_state_id state_id; /* linux calls this seq */
reqid_t reqid;
bool esn;
unsigned replay_window;
/* crypto: algorithm descriptions and their keys */
const struct encrypt_desc *encrypt;
shunk_t encrypt_key;
const struct integ_desc *integ;
shunk_t integ_key;
const struct ipcomp_desc *ipcomp;
chunk_t sec_label;
const struct ipsec_interface *ipsec_interface;
/* byte and packet limits; NOTE(review): the max vs soft semantics are not visible in this header */
uint64_t sa_ipsec_max_bytes;
uint64_t sa_max_soft_bytes;
uint64_t sa_ipsec_max_packets;
uint64_t sa_max_soft_packets;
deltatime_t sa_lifetime; /* number of seconds until SA expires */
struct nic_offload nic_offload;
/* linux jibberish */
const struct sa_mark *sa_mark_out; /* config keyword mark-out */
bool decap_dscp;
bool encap_dscp;
bool nopmtudisc;
uint32_t tfcpad;
const struct config_iptfs *iptfs; /* non-NULL when enabled */
};
/*
* The names, capabilities and operations of one kernel IPsec interface.
*
* Tables of this type are declared below (xfrm_kernel_ops,
* pfkeyv2_kernel_ops, kernel_stacks[]); the global kernel_ops pointer
* refers to one of these tables.
*/
struct kernel_ops {
/*
* The names used to identify the interface.
*
* It's assumed that protostack=PROTOSTACK_NAMES[0] is
* preferred.
*/
const char **protostack_names;
/*
* This name is fed to updown using the environment variable
* PLUTO_STACK. It needs to match the _updown.* name that was
* installed.
*
* Typically it's the same as PROTOSTACK_NAMES[0]. But not
* necessarily. On BSD it's currently "bsdkame", but could
* easily be renamed to "setkey" as it is the setkey command
* that is used to manage the interface.
*/
const char *updown_name;
/*
* The user friendly name to use when logging errors.
*/
const char *interface_name;
/*
* Capabilities and limits of the interface.
* NOTE(review): exact semantics are not visible in this header.
*/
bool overlap_supported;
bool sha2_truncbug_support;
bool esn_supported;
uintmax_t max_replay_window;
/*
* Hooks that take only a logger.
*/
void (*init)(struct logger *logger);
void (*flush)(struct logger *logger);
void (*poke_holes)(struct logger *logger);
void (*plug_holes)(struct logger *logger);
void (*shutdown)(struct logger *logger);
/*
* Add (or replace, per OP) and delete a kernel policy between
* the SRC_CLIENT and DST_CLIENT selectors in direction DIR.
*
* FUNC is presumably the caller's name, for logging -- TODO
* confirm.
*/
bool (*policy_add)(enum kernel_policy_op op,
enum direction dir,
const ip_selector *src_client,
const ip_selector *dst_client,
const struct kernel_policy *policy,
deltatime_t use_lifetime,
struct logger *logger,
const char *func);
bool (*policy_del)(enum direction dir,
enum expect_kernel_policy expect_kernel_policy,
const ip_selector *src_client,
const ip_selector *dst_client,
const struct sa_marks *sa_marks,
const struct ipsec_interface *xfrmi,
enum kernel_policy_id id,
const shunk_t sec_label, /*needed*/
struct logger *logger,
const char *func);
/*
* XXX: to delete an SA, delete its SPI.
*/
bool (*add_sa)(const struct kernel_state *sa,
bool replace,
struct logger *logger);
/*
* Query the kernel state SA; results come back through BYTES,
* ADD_TIME and LASTUSED.
*/
bool (*get_kernel_state)(const struct kernel_state *sa,
uint64_t *bytes,
uint64_t *add_time,
uint64_t *lastused,
struct logger *logger);
/*
* Allocate and delete IPsec ESP/AH (IPCOMP) SPIs. (creating a
* larval kernel state).
*
* Compression IDs are allocated using the same system call;
* except the MIN/MAX is smaller and IPCOMP is specified as
* the protocol.
*
* Typically the larval kernel state is matured by adding the
* negotiated crypto, key, et.al.
*
*
* When deleting the kernel state (larval, mature, ...) only
* the SPI and addresses are needed.
*/
ipsec_spi_t (*get_ipsec_spi)(ipsec_spi_t avoid,
const ip_address *src,
const ip_address *dst,
const struct ip_protocol *proto,
reqid_t reqid,
uintmax_t min, uintmax_t max,
const char *story, /* often SAID string */
struct logger *logger);
bool (*del_ipsec_spi)(ipsec_spi_t spi,
const struct ip_protocol *proto,
const ip_address *src,
const ip_address *dst,
const char *story, /* often SAID string */
struct logger *logger);
/*
* Returns NULL(ok) or what needs to be enabled.
*/
err_t (*migrate_ipsec_sa_is_enabled)(struct logger *);
bool (*migrate_ipsec_sa)(struct child_sa *child);
err_t (*iptfs_ipsec_sa_is_enabled)(struct logger *);
bool (*iptfs_ipsec_sa)(struct child_sa *child);
err_t (*directional_ipsec_sa_is_enabled)(struct logger *);
bool (*directional_ipsec_sa)(struct child_sa *child);
bool (*poke_ipsec_policy_hole)(int fd, const struct ip_info *afi, struct logger *logger);
bool (*detect_nic_offload)(const char *name, struct logger *logger);
bool (*poke_ipsec_offload_policy_hole)(struct nic_offload *nic_offload, struct logger *logger);
/* extensions */
const struct kernel_ipsec_interface *ipsec_interface;
};
/* NOTE(review): the int result is presumably a file descriptor -- TODO confirm */
extern int create_socket(const struct kernel_iface *ifp, const char *v_name, int port, int proto);
/* pointer to a kernel interface's operations table */
extern const struct kernel_ops *kernel_ops;
/* per-interface operations tables; each is declared only when its build macro is defined */
#ifdef KERNEL_XFRM
extern const struct kernel_ops xfrm_kernel_ops;
#endif
#ifdef KERNEL_PFKEYV2
extern const struct kernel_ops pfkeyv2_kernel_ops;
#endif
/* array of pointers to operations tables; NOTE(review): how it is terminated is not visible here */
extern const struct kernel_ops *const kernel_stacks[];
/* bare (connectionless) shunt (eroute) table
*
* Bare shunts are those that don't "belong" to a connection.
* This happens because some %trapped traffic hasn't yet or cannot be
* assigned to a connection. The usual reason is that we cannot discover
* the peer SG. Another is that even when the peer has been discovered,
* it may be that no connection matches all the particulars.
* We record them so that, with scanning, we can discover
* which %holds are new and which others should expire.
*/
#define SHUNT_SCAN_INTERVAL_SECONDS (2*10)
#define SHUNT_SCAN_INTERVAL deltatime(SHUNT_SCAN_INTERVAL_SECONDS) /* time between scans of eroutes */
/* SHUNT_PATIENCE only has resolution down to a multiple of the sample rate,
* SHUNT_SCAN_INTERVAL.
* By making SHUNT_PATIENCE an odd multiple of half of SHUNT_SCAN_INTERVAL,
* we minimize the effects of jitter.
*
* With a 20 second scan interval this is 15 half-intervals: 150 seconds.
*/
#define SHUNT_PATIENCE deltatime(SHUNT_SCAN_INTERVAL_SECONDS * 15 / 2) /* inactivity timeout */
/* default shunt lifetime: 15 minutes */
#define PLUTO_SHUNT_LIFE_DURATION_DEFAULT deltatime(15 * secs_per_minute)
/* NOTE(review): presumably initialized from the macros above -- TODO confirm against the definitions */
extern deltatime_t bare_shunt_interval;
extern deltatime_t pluto_shunt_lifetime;
/*
* Bare shunt table access.
*
* NOTE(review): the implementations are not in this header; the notes
* below are inferred from names and signatures only.
*/
extern void show_shunt_status(struct show *);
extern unsigned shunt_count(void);
/*
* Returns a pointer to a bare shunt pointer; presumably the table
* entry matching OURS and PEERS -- TODO confirm, including what is
* returned when there is no match.
*/
struct bare_shunt **bare_shunt_ptr(const ip_selector *ours,
const ip_selector *peers,
const char *why);
/* takes the address of the pointer to the bare shunt being freed */
void free_bare_shunt(struct bare_shunt **pp);
/* A netlink header defines EM_MAXRELSPIS, the max number of SAs in a group.
* Is there a PF_KEY equivalent?
*
* When no earlier header has defined it, fall back to 4.
*/
#ifndef EM_MAXRELSPIS
# define EM_MAXRELSPIS 4 /* AH ESP IPCOMP IPIP */
#endif
/*
* Kernel interface entry points.
*
* NOTE(review): the implementations are not in this header; the notes
* below are inferred from names and signatures only.
*/
extern void init_kernel(struct logger *logger);
/*
* EXPECT_KERNEL_POLICY says whether the kernel policy is expected to
* be present, missing, or either (see enum expect_kernel_policy).
*/
extern bool flush_bare_shunt(const ip_address *src, const ip_address *dst,
const struct ip_protocol *transport_proto,
enum expect_kernel_policy expect_kernel_policy,
const char *why, struct logger *logger);
void orphan_holdpass(struct connection *c,
struct spd *sr,
struct logger *logger);
/*
* Obtain an SPI (get_ipsec_spi) or, going by the name, a compression
* ID (get_ipsec_cpi) for connection C; see also
* kernel_ops.get_ipsec_spi().
*/
extern ipsec_spi_t get_ipsec_spi(const struct connection *c,
const struct ip_protocol *proto,
ipsec_spi_t avoid,
struct logger *logger/*state*/);
extern ipsec_spi_t get_ipsec_cpi(const struct connection *c,
struct logger *logger/*state*/);
bool unrouted_to_routed(struct connection *c, enum routing new_routing, where_t where);
bool install_inbound_ipsec_sa(struct child_sa *child, enum routing new_routing, where_t where);
/*
* Flags passed by value to install_outbound_ipsec_sa().
*
* NOTE(review): presumably they select which updown actions to run
* ("up" and/or "route") -- TODO confirm against the implementation.
*/
struct do_updown {
bool up;
bool route;
};
bool install_outbound_ipsec_sa(struct child_sa *child, enum routing new_routing,
struct do_updown updown, where_t where);
/*
* Kernel state teardown, traffic queries, and expiry handling.
*
* NOTE(review): the implementations are not in this header; the notes
* below are inferred from names and signatures only.
*/
void teardown_ipsec_kernel_states(struct child_sa *child);
void uninstall_kernel_states(struct child_sa *child);
extern bool was_eroute_idle(struct child_sa *child, deltatime_t idle_max);
extern bool get_ipsec_traffic(struct child_sa *child, struct ipsec_proto_info *sa, enum direction direction);
/* going by the names, wrappers around the matching kernel_ops hooks -- TODO confirm */
bool kernel_ops_migrate_ipsec_sa(struct child_sa *child);
extern void show_kernel_interface(struct show *s);
void shutdown_kernel(struct logger *logger);
extern bool kernel_ops_detect_nic_offload(const char *name, struct logger *logger);
/* HARD presumably distinguishes a hard expire from a soft one -- TODO confirm */
extern void handle_sa_expire(ipsec_spi_t spi, uint8_t protoid, ip_address dst,
bool hard, uint64_t bytes, uint64_t packets, uint64_t add_time,
struct logger *logger);
/*
 * An SPD priority: a 32-bit value wrapped in a single-member struct.
 */
typedef struct {
	uint32_t value;
} spd_priority_t;

/* printf conversion for pri_spd_priority(); use as "%"PRI_SPD_PRIORITY */
#define PRI_SPD_PRIORITY PRIu32

/* the uint32_t inside spd_priority_t P, suitable for PRI_SPD_PRIORITY */
#define pri_spd_priority(P) ((P).value)
/* NOTE(review): whether "highest" means the numerically largest or smallest value is not visible here */
extern const spd_priority_t highest_spd_priority;
/* returns the priority for SPD; how it is computed is not visible in this header */
spd_priority_t spd_priority(const struct spd *spd);
/*
* The particulars of a request to start an on-demand exchange,
* triggered either by a kernel acquire or by whack (see .by_acquire).
*
* Several fields are noted as being "on stack".
* NOTE(review): that suggests they must not be retained beyond the
* call -- TODO confirm.
*/
struct kernel_acquire {
ip_packet packet; /* that triggered the on-demand exchange */
bool by_acquire; /* by kernel acquire, else by whack */
const struct logger *logger; /* on stack, could have whack attached */
bool background; /* close whackfd once started */
shunk_t sec_label; /* on stack */
enum kernel_state_id state_id; /* matches kernel state's .seq? */
enum kernel_policy_id policy_id; /* matches kernel policy's .index? */
};
/* going by the jam_ prefix and the jambuf parameter, appends a description of B to BUF -- TODO confirm */
void jam_kernel_acquire(struct jambuf *buf, const struct kernel_acquire *b);
/*
* NIC offload setup, SPD ownership/conflict checks, and kernel policy
* cleanup.
*
* NOTE(review): the implementations are not in this header; the notes
* below are inferred from names and signatures only.
*/
/* NIC_OFFLOAD is non-const; presumably it is filled in from connection C -- TODO confirm */
void setup_esp_nic_offload(struct nic_offload *nic_offload,
const struct connection *c,
struct logger *logger);
/* returns a struct spd_owner by value */
struct spd_owner spd_owner(const struct spd *spd, enum routing new_routing,
struct logger *logger, where_t where);
void clear_connection_spd_conflicts(struct connection *c);
/*
* OWNER and BARE_SHUNT are non-const pointers; presumably they
* receive results -- TODO confirm.
*/
bool get_connection_spd_conflict(const struct spd *spd,
const enum routing new_routing,
struct spd_owner *owner,
struct bare_shunt ***bare_shunt,
struct logger *logger);
void clear_narrow_holds(const ip_selector *src_client,
const ip_selector *dst_client,
struct logger *logger);
void revert_kernel_policy(struct spd *spd,
struct child_sa *child/*could be NULL*/,
struct logger *logger);
#endif
|