package cstruct

  1. Overview
  2. Docs

Description

Cstruct is a library and syntax extension to make it easier to access C-like structures directly from OCaml. It supports both reading and writing to these structures, and they are accessed via the Bigarray module.

Tags

org:mirage org:ocamllabs

Published: 27 Mar 2019

README

Cstruct -- access C-like structures directly from OCaml

v4.0.0

Cstruct is a library and syntax extension to make it easier to access C-like structures directly from OCaml. It supports both reading and writing to these structures, and they are accessed via the Bigarray module.

Installation

This repository provides several packages that can be installed via the OPAM package manager:

  • cstruct: the core Cstruct library

  • cstruct-sexp: serialisers into s-expression format of Cstructs

  • cstruct-unix: provide Unix variations of the read/write functions using file descriptors

  • cstruct-async: provide Async Pipe and Bigstring support

  • cstruct-lwt: provide Lwt variants of read/write functions

  • ppx_cstruct: a PPX syntax extension (see below)

The libraries depend on OCaml version 4.02.3 and later, since it provides a ppx extension point. The old camlp4 syntax extension is nolonger available; the last cstruct release which contained it was v1.9.0.

Local development

You can build the library via dune, using make or dune build directly. Since everything is built via dune, you can also place this repository within a wider dune workspace in order to make local modifications across repositories.

Usage

PPX

The PPX processor is used by passing the OCaml source code through the ppx_cstruct binary. An example pcap description is:

[%%cstruct
type pcap_header = {
  magic_number: uint32_t;   (* magic number *)
  version_major: uint16_t;  (* major version number *)
  version_minor: uint16_t;  (* minor version number *)
  thiszone: uint32_t;       (* GMT to local correction *)
  sigfigs: uint32_t;        (* accuracy of timestamps *)
  snaplen: uint32_t;        (* max length of captured packets, in octets *)
  network: uint32_t;        (* data link type *)
} [@@little_endian]]

[%%cstruct
type pcap_packet = {
  ts_sec: uint32_t;         (* timestamp seconds *)
  ts_usec: uint32_t;        (* timestamp microseconds *)
  incl_len: uint32_t;       (* number of octets of packet saved in file *)
  orig_len: uint32_t;       (* actual length of packet *)
} [@@little_endian]]

[%%cstruct
type ethernet = {
  dst: uint8_t [@len 6];
  src: uint8_t [@len 6];
  ethertype: uint16_t;
} [@@big_endian]]

[%%cstruct
type ipv4 = {
  hlen_version: uint8_t;
  tos: uint8_t;
  len: uint16_t;
  id: uint16_t;
  off: uint16_t;
  ttl: uint8_t;
  proto: uint8_t;
  csum: uint16_t;
  src: uint8_t [@len 4];
  dst: uint8_t [@len 4];
} [@@big_endian]]

This auto-generates generates functions of the form below in the ml file:

let sizeof_pcap_packet = 16
let get_pcap_packet_ts_sec v = Cstruct.LE.get_uint32 v 0
let set_pcap_packet_ts_sec v x = Cstruct.LE.set_uint32 v 0 x
let get_pcap_packet_ts_usec v = Cstruct.LE.get_uint32 v 4
let set_pcap_packet_ts_usec v x = Cstruct.LE.set_uint32 v 4 x
let get_pcap_packet_incl_len v = Cstruct.LE.get_uint32 v 8
let set_pcap_packet_incl_len v x = Cstruct.LE.set_uint32 v 8 x
let get_pcap_packet_orig_len v = Cstruct.LE.get_uint32 v 12
let set_pcap_packet_orig_len v x = Cstruct.LE.set_uint32 v 12 x

let sizeof_ethernet = 14
let get_ethernet_dst src = Cstruct.sub src 0 6
let copy_ethernet_dst src = Cstruct.copy src 0 6
let set_ethernet_dst src srcoff dst =
  Cstruct.blit_from_string src srcoff dst 0 6
let blit_ethernet_dst src srcoff dst = Cstruct.blit src srcoff dst 0 6
let get_ethernet_src src = Cstruct.sub src 6 6
let copy_ethernet_src src = Cstruct.copy src 6 6
let set_ethernet_src src srcoff dst =
  Cstruct.blit_from_string src srcoff dst 6 6
let blit_ethernet_src src srcoff dst = Cstruct.blit src srcoff dst 6 6
let get_ethernet_ethertype v = Cstruct.BE.get_uint16 v 12
let set_ethernet_ethertype v x = Cstruct.BE.set_uint16 v 12 x

The mli file will have signatures of this form:

val sizeof_pcap_packet : int
val get_pcap_packet_ts_sec : Cstruct.t -> Cstruct.uint32
val set_pcap_packet_ts_sec : Cstruct.t -> Cstruct.uint32 -> unit
val get_pcap_packet_ts_usec : Cstruct.t -> Cstruct.uint32
val set_pcap_packet_ts_usec : Cstruct.t -> Cstruct.uint32 -> unit
val get_pcap_packet_incl_len : Cstruct.t -> Cstruct.uint32
val set_pcap_packet_incl_len : Cstruct.t -> Cstruct.uint32 -> unit
val get_pcap_packet_orig_len : Cstruct.t -> Cstruct.uint32
val set_pcap_packet_orig_len : Cstruct.t -> Cstruct.uint32 -> unit
val hexdump_pcap_packet_to_buffer : Buffer.t -> pcap_packet -> unit
val hexdump_pcap_packet : Cstruct.t -> unit

val sizeof_ethernet : int
val get_ethernet_dst : Cstruct.t -> Cstruct.t
val copy_ethernet_dst : Cstruct.t -> string
val set_ethernet_dst : string -> int -> Cstruct.t -> unit
val blit_ethernet_dst : Cstruct.t -> int -> Cstruct.t -> unit
val get_ethernet_src : Cstruct.t -> Cstruct.t
val copy_ethernet_src : Cstruct.t -> string
val set_ethernet_src : string -> int -> Cstruct.t -> unit
val blit_ethernet_src : Cstruct.t -> int -> Cstruct.t -> unit
val get_ethernet_ethertype : Cstruct.t -> Cstruct.uint16
val set_ethernet_ethertype : Cstruct.t -> Cstruct.uint16 -> unit
val hexdump_ethernet_to_buffer : Buffer.t -> Cstruct.t -> unit
val hexdump_ethernet : Cstruct.t -> unit

The hexdump functions above are convenient pretty-printing functions to help you debug, and aren't intended to be high performance.

You can also declare C-like enums:

[%%cenum
type foo32 =
  | ONE32
  | TWO32 [@id 0xfffffffel]
  | THREE32
  [@@uint32_t]
]

[%%cenum
type bar16 =
  | ONE [@id 1]
  | TWO
  | FOUR [@id 4]
  | FIVE
  [@@uint16_t]
]

This generates signatures of the form:

type foo32 = | ONE32 | TWO32 | THREE32
val int_to_foo32 : int32 -> foo32 option
val foo32_to_int : foo32 -> int32
val foo32_to_string : foo32 -> string
val string_to_foo32 : string -> foo32 option
type bar16 = | ONE | TWO | FOUR | FIVE
val int_to_bar16 : int -> bar16 option
val bar16_to_int : bar16 -> int
val bar16_to_string : bar16 -> string
val string_to_bar16 : string -> bar16 option

You can also add a (sexp) decorator to output s-expression convertors for use with the sexplib library.

[%%cenum
type foo64 =
  | ONE64
  | TWO64
  | THREE64
  [@@uint64_t] [@@sexp]
]

And sexp_of_foo64 and foo64_of_sexp functions will also be available. The representation of the Sexp is the string representation of the enum.

If you do use the sexp decorator, then you will also need to add sexplib to the dependency list for your package (both in the dune file and the opam file).

Please see the ppx_test/ directory for more in-depth examples.

Dependencies (2)

  1. dune >= "1.0"
  2. ocaml >= "4.03.0"

Dev Dependencies (1)

  1. alcotest with-test

  1. albatross < "1.4.3"
  2. angstrom < "0.7.0"
  3. asn1-combinators < "0.2.6"
  4. balancer
  5. bip32
  6. buffer-pool
  7. certify
  8. chacha < "1.1.0"
  9. colombe < "0.2.0"
  10. conduit-mirage
  11. conex < "0.10.0"
  12. conex-mirage-crypto
  13. cowabloga
  14. crc
  15. cstruct-lwt = "3.7.0"
  16. datakit-server
  17. depyt
  18. dns < "6.3.0"
  19. dns-client < "6.3.0"
  20. dns-forward
  21. dnssd
  22. dream < "1.0.0~alpha2"
  23. duff < "0.3"
  24. eqaf >= "0.8" & < "0.10"
  25. eqaf-cstruct
  26. fat-filesystem >= "0.13.0" & < "0.15.1"
  27. fiat-p256
  28. git < "3.2.0"
  29. github-hooks
  30. gluten-mirage < "0.3.0"
  31. gpt
  32. h2-mirage
  33. hacl-star >= "0.7.0"
  34. hacl_x25519
  35. hex
  36. hkdf
  37. httpun-mirage
  38. httpun-ws-mirage
  39. hvsock < "3.0.0"
  40. io-page
  41. io-page-unix
  42. ipv6-multicast
  43. irmin-git
  44. irmin-indexeddb
  45. key-parsers < "1.2.1"
  46. launchd
  47. learn-ocaml-client
  48. mirage-block >= "2.0.1"
  49. mirage-block-combinators < "3.0.2"
  50. mirage-block-lwt
  51. mirage-block-unix < "2.14.2"
  52. mirage-btrees
  53. mirage-channel = "4.0.1"
  54. mirage-channel-lwt
  55. mirage-conduit
  56. mirage-console-lwt
  57. mirage-crypto < "0.10.7"
  58. mirage-crypto-rng < "0.10.7"
  59. mirage-crypto-rng-mirage < "1.1.0"
  60. mirage-flow >= "3.0.0"
  61. mirage-flow-lwt
  62. mirage-fs >= "4.0.0"
  63. mirage-fs-lwt
  64. mirage-kv-lwt
  65. mirage-kv-unix
  66. mirage-net >= "4.0.0"
  67. mirage-net-lwt
  68. mirage-net-macosx
  69. mirage-net-solo5
  70. mirage-net-unikraft
  71. mirage-net-unix
  72. mirage-profile
  73. mirage-protocols-lwt
  74. mirage-random
  75. mirage-solo5 < "0.10.0"
  76. mirage-stack-lwt
  77. mirage-tc
  78. mirage-types-lwt
  79. mirage-xen
  80. monorobot
  81. mstruct
  82. nbd = "4.0.3"
  83. nocrypto
  84. noise
  85. pcap-format >= "0.5.2"
  86. pf-qubes
  87. protocol-9p = "2.0.1"
  88. protocol-9p-tool = "0.12.0" | >= "2.0.0" & < "2.0.2"
  89. protocol-9p-unix < "2.0.2"
  90. qcow >= "0.11.0"
  91. qcow-tool
  92. randomconv < "0.2.0"
  93. rawlink < "1.2"
  94. resp-mirage = "0.10.0"
  95. rfc6287
  96. salsa20 < "1.2.0"
  97. salsa20-core >= "0.3.0" & < "1.1.0"
  98. secp256k1-internal < "0.3.0"
  99. sendmail >= "0.4.1" & < "0.5.0"
  100. shared-memory-ring-lwt
  101. slack
  102. ssh-agent
  103. tls < "0.14.1"
  104. tls-liquidsoap
  105. uecc
  106. vchan < "6.0.1"
  107. vchan-unix
  108. vchan-xen
  109. vhd-format >= "0.12.0" & < "0.13.0"
  110. vhd-format-lwt < "0.13.0"
  111. vmnet
  112. x509 < "0.14.1"
  113. xen-gnt

Conflicts

None

OCaml

Innovation. Community. Security.