1 .\" Copyright (c) 2008, Sun Microsystems, Inc.  All Rights Reserved
   2 .\" Copyright (c) 2017, Joyent, Inc.
   3 .\" The contents of this file are subject to the terms of the
   4 .\" Common Development and Distribution License (the "License").
   5 .\" You may not use this file except in compliance with the License.
   6 .\"
   7 .\" You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
   8 .\" or http://www.opensolaris.org/os/licensing.
   9 .\" See the License for the specific language governing permissions
  10 .\" and limitations under the License.
  11 .\"
  12 .\" When distributing Covered Code, include this CDDL HEADER in each
  13 .\" file and include the License file at usr/src/OPENSOLARIS.LICENSE.
  14 .\" If applicable, add the following below this CDDL HEADER, with the
  15 .\" fields enclosed by brackets "[]" replaced with your own identifying
  16 .\" information: Portions Copyright [yyyy] [name of copyright owner]
  17 .Dd October 23, 2017
  18 .Dt IPNAT 7I
  19 .Os
  20 .Sh NAME
  21 .Nm ipnat
  22 .Nd IP Filter/NAT module interface
  23 .Sh DESCRIPTION
  24 The
  25 .Sy ipnat
  26 device provides interaction with the NAT features of the Solaris IP Filter.
  27 .Sh APPLICATION PROGRAMMING INTERFACE
  28 The NAT features programming model is a component of the Solaris IP Filter and
  29 is accessed via the NAT device file
  30 .Pa /dev/ipnat .
  31 Opening the device for
  32 reading or writing determines which ioctl calls can be successfully made.
  33 .Sh IOCTLS
  34 The caller must construct a
  35 .Vt ipfobj
  36 structure when issuing a
  37 .Sy SIOCGNATL
  38 or
  39 .Sy SIOCSTPUT
  40 ioctl.
  41 The
  42 .Vt ipfobj
  43 structure is then passed
  44 to the ioctl call and is filled out with
  45 .Fa ipfo_type
  46 set to
  47 .Dv IPFOBJ_ Ns value .
  48 .Dv IPFOBJ_ Ns value
  49 provides a matching name for the structure, while
  50 .Fa ipfo_size
  51 is set to the total size of the structure being passed and
  52 .Fa ipfo_ptr
  53 is set to the structure address.
  54 The
  55 .Fa ipfo_rev
  56 field should be set to the current value of
  57 .Dv IPFILTER_VERSION ,
  58 while
  59 .Fa ipfo_offset
  60 and
  61 .Fa ipfo_xxxpad
  62 should be set to 0.
  63 .Bd -literal -offset 2n
  64 /*
  65  * Structure used with SIOCGNATL/SIOCSTPUT.
  66  */
  67 
  68 /*
  69  * Object structure description.  For passing through in ioctls.
  70  */
  71 typedef struct  ipfobj  {
  72      u_32_t  ipfo_rev;         /* IPFilter version (IPFILTER_VERSION) */
  73      u_32_t  ipfo_size;        /* size of object at ipfo_ptr */
  74      void    *ipfo_ptr;        /* pointer to object */
  75      int     ipfo_type;        /* type of object being pointed to */
  76      int     ipfo_offset;      /* bytes from ipfo_ptr where to start */
  77      u_char  ipfo_xxxpad[32];  /* reserved for future use */
  78 } ipfobj_t;
  79 
  80 #define IPFILTER_VERSION        4010901 /* IPFilter version */
  81 #define IPFOBJ_NATSAVE          8       /* struct nat_save */
  82 #define IPFOBJ_NATLOOKUP        9       /* struct natlookup */
  83 .Ed
  84 .Pp
  85 The following
  86 .Xr ioctl 2
  87 calls may be used to manipulate the ipnat sub-system inside of ipf.
  88 Note that the ipnat driver only accepts calls from applications
  89 using the same data model as the kernel.
  90 In other words, 64-bit kernels can only accept calls from 64-bit applications.
  91 Calls from 32-bit applications fail
  92 with
  93 .Er EINVAL .
  94 .Bl -tag -width SIOCSTLCK
  95 .It Dv SIOCSTLCK
  96 Set or clear the NAT lock to prevent table updates attributable to packet
  97 flow-through.
  98 .It Dv SIOCGNATL
  99 Search the NAT table for the rdr entry that matches the fields in the natlookup
 100 structure.
 101 The caller must populate the structure with the address/port
 102 information of the accepted TCP connection
 103 .Pq Fa nl_inip , Fa nl_inport
 104 and the
 105 address/port information of the peer
 106 .Pq Fa nl_outip , Fa nl_outport .
 107 The
 108 .Fa nl_flags
 109 field must have the
 110 .Dv IPN_TCP
 111 option set.
 112 All other fields must be set to 0.
 113 If the call succeeds,
 114 .Fa nl_realip
 115 and
 116 .Fa nl_realport
 117 are set to the real destination address and port, respectively.
 118 The
 119 .Fa nl_inport
 120 and
 121 .Fa nl_outport
 122 fields must be in host byte order.
 123 If
 124 .Dv IPN_FINDFORWARD
 125 is set in
 126 .Fa nl_flags ,
 127 a check is made to see if it is
 128 possible to create an outgoing NAT session by checking if a packet coming from
 129 .Pq Fa nl_realip , Fa nl_realport
 130 and destined for
 131 .Pq Fa nl_outip , Fa nl_outport
 132 can be translated.
 133 If translation is possible, the flag remains set, otherwise it is
 134 cleared in the structure returned to the caller.
 135 .Bd -literal -offset indent
 136 /*
 137  * Structure used with SIOCGNATL.
 138  */
 139 typedef struct natlookup {
 140      i6addr_t  nl_inipaddr;
 141      i6addr_t  nl_outipaddr;
 142      i6addr_t  nl_realipaddr;
 143      int       nl_v;
 144      int       nl_flags;
 145      u_short   nl_inport;
 146      u_short   nl_outport;
 147      u_short   nl_realport;
 148 } natlookup_t;
 149 
 150 #define nl_inip       nl_inipaddr.in4
 151 #define nl_outip      nl_outipaddr.in4
 152 #define nl_realip     nl_realipaddr.in4
 153 #define nl_inip6      nl_inipaddr.in6
 154 #define nl_outip6     nl_outipaddr.in6
 155 #define nl_realip6    nl_realipaddr.in6
 156 
 157 /*
 158  * Accepted values for nl_flags
 159  */
 160 #define   IPN_TCP         0x00001
 161 #define   IPN_FINDFORWARD 0x400000
 162 .Ed
 163 .It Dv SIOCSTPUT
 164 Move a NAT mapping structure from user space into the kernel.
 165 This ioctl is used by
 166 .Xr ipfs 1M
 167 to restore NAT sessions saved in
 168 .Pa /var/db/ipf/ipnat.ipf .
 169 The
 170 .Vt nat_save
 171 structure must have its
 172 .Fa ipn_nat
 173 and
 174 .Fa ipn_ipnat
 175 structures filled out correctly.
 176 Fields not assigned a value must be initialised to 0.
 177 All pointer fields are adjusted, as appropriate, once the
 178 structure is passed into the kernel and none are preserved.
 179 .Pp
 180 To create a translation, the following fields must be set:
 181 .\" Force item bodies to next line using 2n width
 182 .Bl -tag -width 2n
 183 .It "Interface name"
 184 The name of the interface through which traffic exits the host must be
 185 set in
 186 .Fa nat_ifnames[0] .
 187 .It "Local IP address and port number"
 188 The connection's local IP address and port
 189 number are stored in network byte order using
 190 .Fa nat_inip Ns / Ns Fa nat_inport .
 191 .It "Destination address/port"
 192 The destination address/port is stored in
 193 .Fa nat_oip Ns / Ns Fa nat_oport .
 194 .It "Target address/port"
 195 The translation's target address/port is stored in
 196 .Fa nat_outip Ns / Ns Fa nat_outport .
 197 .El
 198 .Pp
 199 The caller must also precalculate the checksum adjustments necessary to
 200 complete the translation and store those values in
 201 .Fa nat_sumd
 202 (delta required for the TCP header) and
 203 .Fa nat_ipsumd
 204 (delta required for the IP header).
 205 .Bd -literal -offset indent
 206 /*
 207  * Structures used with SIOCSTPUT.
 208  */
 209 typedef struct  nat_save {
 210      void            *ipn_next;
 211      struct  nat     ipn_nat;
 212      struct  ipnat   ipn_ipnat;
 213      struct  frentry ipn_fr;
 214      int             ipn_dsize;
 215      char            ipn_data[4];
 216 } nat_save_t;
 217 
 218 typedef struct  nat {
 219      ipfmutex_t      nat_lock;
 220      struct  nat     *nat_next;
 221      struct  nat     **nat_pnext;
 222      struct  nat     *nat_hnext[2];
 223      struct  nat     **nat_phnext[2];
 224      struct  hostmap *nat_hm;
 225      void            *nat_data;
 226      struct  nat     **nat_me;
 227      struct  ipstate *nat_state;
 228      struct  ap_session      *nat_aps;
 229      frentry_t       *nat_fr;
 230      struct  ipnat   *nat_ptr;
 231      void            *nat_ifps[2];
 232      void            *nat_sync;
 233      ipftqent_t      nat_tqe;
 234      u_32_t          nat_flags;
 235      u_32_t          nat_sumd[2];
 236      u_32_t          nat_ipsumd;
 237      u_32_t          nat_mssclamp;
 238      i6addr_t        nat_inip6;
 239      i6addr_t        nat_outip6;
 240      i6addr_t        nat_oip6;
 241      U_QUAD_T        nat_pkts[2];
 242      U_QUAD_T        nat_bytes[2];
 243      union   {
 244           udpinfo_t       nat_unu;
 245           tcpinfo_t       nat_unt;
 246           icmpinfo_t      nat_uni;
 247           greinfo_t       nat_ugre;
 248      } nat_un;
 249      u_short         nat_oport;
 250      u_short         nat_use;
 251      u_char          nat_p;
 252      int             nat_dir;
 253      int             nat_ref;
 254      int             nat_hv[2];
 255      char            nat_ifnames[2][LIFNAMSIZ];
 256      int             nat_rev;
 257      int             nat_v;
 258 } nat_t;
 259 
 260 #define nat_inip        nat_inip6.in4
 261 #define nat_outip       nat_outip6.in4
 262 #define nat_oip         nat_oip6.in4
 263 #define nat_inport      nat_un.nat_unt.ts_sport
 264 #define nat_outport     nat_un.nat_unt.ts_dport
 265 /*
 266  * Values for nat_dir
 267  */
 268 #define NAT_INBOUND     0
 269 #define NAT_OUTBOUND    1
 270 /*
 271  * Definitions for nat_flags
 272  */
 273 #define NAT_TCP         0x0001  /* IPN_TCP */
 274 .Ed
 275 .El
 276 .Sh EXAMPLES
 277 The following example shows how to prepare and use
 278 .Dv SIOCSTPUT
 279 to insert a NAT session directly into the table.
 280 Note that the usual TCP/IP code is omitted in this example.
 281 .Pp
 282 In the code segment below,
 283 .Fa incoming_fd
 284 is the TCP connection file descriptor
 285 that is accepted as part of the redirect process, while
 286 .Fa remote_fd
 287 is the outgoing TCP connection to the remote server being translated back to the
 288 original IP address/port pair.
 289 .Pp
 290 Note \(em
 291 The following ipnat headers must be included before you can use the code shown
 292 in this example:
 293 .Bd -literal -offset 2n
 294 #include <netinet/in.h>
 295 #include <arpa/inet.h>
 296 #include <net/if.h>
 297 #include <netinet/ipl.h>
 298 #include <netinet/ip_compat.h>
 299 #include <netinet/ip_fil.h>
 300 #include <netinet/ip_nat.h>
 301 #include <string.h>
 302 #include <fcntl.h>
 303 .Ed
 304 .Pp
 305 Note \(em
 306 In the example below, various code fragments have been excluded to enhance
 307 clarity.
 308 .Bd -literal -offset 2n
 309 int
 310 translate_connection(int incoming_fd)
 311 {
 312      struct sockaddr_in usin;
 313      struct natlookup nlp;
 314      struct nat_save ns;
 315      struct ipfobj obj;
 316      struct nat *nat;
 317      int remote_fd;
 318      int nat_fd;
 319      int onoff;
 320 
 321      memset(&ns, 0, sizeof(ns));
 322      nat = &ns.ipn_nat;
 323 
 324      namelen = sizeof(usin);
 325      getsockname(remote_fd, (struct sockaddr *)&usin, &namelen);
 326 
 327      namelen = sizeof(sin);
 328      getpeername(incoming_fd, (struct sockaddr *) &sin, &namelen);
 329 
 330      namelen = sizeof(sloc);
 331      getsockname(incoming_fd, (struct sockaddr *) &sloc, &namelen);
 332 
 333      bzero((char *) &obj, sizeof(obj));
 334      obj.ipfo_rev = IPFILTER_VERSION;
 335      obj.ipfo_size = sizeof(nlp);
 336      obj.ipfo_ptr = &nlp;
 337      obj.ipfo_type = IPFOBJ_NATLOOKUP;
 338 
 339      /*
 340       * Build up the NAT natlookup structure.
 341       */
 342      bzero((char *) &nlp, sizeof(nlp));
 343      nlp.nl_outip = sin.sin_addr;
 344      nlp.nl_inip = sloc.sin_addr;
 345      nlp.nl_flags = IPN_TCP;
 346      nlp.nl_outport = ntohs(sin.sin_port);
 347      nlp.nl_inport = ntohs(sloc.sin_port);
 348 
 349      /*
 350       * Open the NAT device and lookup the mapping pair.
 351       */
 352      nat_fd = open(IPNAT_NAME, O_RDWR);
 353      if (ioctl(nat_fd, SIOCGNATL, &obj) != 0)
 354           return -1;
 355 
 356      nat->nat_inip = usin.sin_addr;
 357      nat->nat_outip = nlp.nl_outip;
 358      nat->nat_oip = nlp.nl_realip;
 359 
 360      sum1 = LONG_SUM(ntohl(usin.sin_addr.s_addr)) +
 361             ntohs(usin.sin_port);
 362      sum2 = LONG_SUM(ntohl(nat->nat_outip.s_addr)) +
 363             ntohs(nlp.nl_outport);
 364      CALC_SUMD(sum1, sum2, sumd);
 365      nat->nat_sumd[0] = (sumd & 0xffff) + (sumd >> 16);
 366      nat->nat_sumd[1] = nat->nat_sumd[0];
 367 
 368      sum1 = LONG_SUM(ntohl(usin.sin_addr.s_addr));
 369      sum2 = LONG_SUM(ntohl(nat->nat_outip.s_addr));
 370      CALC_SUMD(sum1, sum2, sumd);
 371      nat->nat_ipsumd = (sumd & 0xffff) + (sumd >> 16);
 372 
 373      nat->nat_inport = usin.sin_port;
 374      nat->nat_outport = nlp.nl_outport;
 375      nat->nat_oport = nlp.nl_realport;
 376 
 377      nat->nat_flags = IPN_TCPUDP;
 378 
 379      /*
 380       * Prepare the ipfobj structure, accordingly.
 381       */
 382      bzero((char *)&obj, sizeof(obj));
 383      obj.ipfo_rev = IPFILTER_VERSION;
 384      obj.ipfo_size = sizeof(ns);
 385      obj.ipfo_ptr = &ns;
 386      obj.ipfo_type = IPFOBJ_NATSAVE;
 387 
 388      onoff = 1;
 389      if (ioctl(nat_fd, SIOCSTPUT, &obj) != 0)
 390           fprintf(stderr, "Error occurred\en");
 391 
 392      return connect(remote_fd, (struct sockaddr *)&usin, sizeof(usin));
 393 }
 394 .Ed
 395 .Sh ERRORS
 396 .Bl -tag -width Er
 397 .It Er EPERM
 398 The device has been opened for reading only.
 399 To succeed, the device must be opened for both reading and writing.
 400 This error may also be returned if the call is
 401 privileged and the calling process did not assert
 402 .Brq Sy PRIV_SYS_NET_CONFIG
 403 in the effective set.
 404 .It Er ENOMEM
 405 More memory was requested than the kernel can provide.
 406 This error may also be returned if the application inserts a NAT entry that
 407 exceeds the hash bucket chain's maximum length.
 408 .It Er EFAULT
 409 The calling process specified an invalid pointer in the ipfobj structure.
 410 .It Er EINVAL
 411 The kernel detected a parameter or field set to an unacceptable value.
 412 .It Er EEXIST
 413 The calling process, via
 414 .Dv SIOCSTPUT ,
 415 attempted to add a NAT entry that already exists in the NAT table.
 416 .It Er ESRCH
 417 The calling process called
 418 .Dv SIOCSTPUT
 419 before setting the
 420 .Dv SI_NEWFR
 421 flag and providing a pointer in the
 422 .Fa nat_fr
 423 field that cannot be found in the current rule set.
 424 .It Er EACCES
 425 The calling process issued a
 426 .Dv SIOCSTPUT
 427 before issuing a
 428 .Dv SIOCSTLCK .
 429 .El
 430 .Sh INTERFACE STABILITY
 431 Committed
 432 .Sh SEE ALSO
 433 .Xr ipfs 1M ,
 434 .Xr ipnat 1M ,
 435 .Xr ioctl 2 ,
 436 .Xr attributes 5