/usr/lib/ocaml/netstring/netencoding.mli is in libocamlnet-ocaml-dev 4.0.4-1build3.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 | (* $Id: netencoding.mli 2195 2015-01-01 12:23:39Z gerd $
* ----------------------------------------------------------------------
*
*)
(** Base64, Quoted Printable, URL encoding, HTML escaping *)
(* *********************************************************************)
(* Several encodings important for the net *)
(* *********************************************************************)
(* *********************************************************************)
(* Base 64 encoding *)
(* *********************************************************************)
(* See RFC 2045 for a description of Base 64 encoding. *)
(* THREAD-SAFETY:
* All Base64 functions are reentrant and thus thread-safe.
*)
module Base64 : sig
(** Base64 encoding as described in RFC 2045 *)
val encode : ?pos:int -> ?len:int -> ?linelength:int -> ?crlf:bool ->
string -> string
(** Compute the "base 64" encoding of the given string argument.
* Note that the result is a string that only contains the characters
* a-z, A-Z, 0-9, +, /, =, and optionally spaces, CR and LF characters.
*
* If [pos] and/or [len] are passed, only the substring starting at
* [pos] (default: 0) with length [len] (default: rest of the string)
* is encoded.
*
* The result is divided up into lines not longer than [linelength]
* (without counting the line separator); default: do not divide lines.
* If [linelength] is smaller than 4, no line division is performed.
* If [linelength] is not divisible by 4, the produced lines are a
* bit shorter than [linelength].
*
* If [crlf] (default: false) the lines are ended by CRLF; otherwise
* they are only ended by LF.
* (You need the crlf option to produce correct MIME messages.)
*
*)
val url_encode : ?pos:int -> ?len:int -> ?linelength:int -> ?crlf:bool ->
string -> string
(** Same as [encode] but use slightly different characters that can be
* part of URLs without additional encodings.
* The encoded string consists only of the characters a-z, A-Z, 0-9,
* -, /, .
* [url_encode] does {b not} implement the Base 64 encoding as described
* in the standard!
*
* @deprecated Since Ocamlnet 0.98, this function is deprecated,
* as it is non-standard, and it has a confusing name.
*)
val decode : ?pos:int -> ?len:int -> ?url_variant:bool ->
?accept_spaces:bool -> string -> string
(** Decodes the given string argument.
*
* If [pos] and/or [len] are passed, only the substring starting at
* [pos] (default: 0) with length [len] (default: rest of the string)
* is decoded.
*
* If [url_variant] (default: [true]) is set, the functions also
* accepts the characters '-' and '.' as produced by [url_encode].
*
* If [accept_spaces] (default: [false]) is set, the function ignores
* white space contained in the string to decode (otherwise the
* function fails if it finds white space). Furthermore, the character
* '>' is considered as "space", too (so you don't have trouble with
* mbox mailboxes that accidentally quote "From").
*)
class encoding_pipe : ?linelength:int -> ?crlf:bool -> unit ->
Netchannels.pipe
(** This pipe encodes the data written into the pipe.
* [linelength] and [crlf] work as in [encode].
*)
class decoding_pipe : ?url_variant:bool -> ?accept_spaces:bool -> unit ->
Netchannels.pipe
(** This pipe decodes the data written into the pipe.
* [url_variant] and [accept_spaces] work as in [decode].
*)
end
(* *********************************************************************)
(* Quoted printable encoding *)
(* *********************************************************************)
(* THREAD-SAFETY:
* All QuotedPrintable functions are reentrant and thus thread-safe.
*)
module QuotedPrintable :
sig
(** This module implements the "Quoted Printable" encoding as
* described in RFC 2045.
*
* This implementation assumes that the encoded string has a text MIME
* type. On input both CR/LF and LF are accepted as end-of-line (eol) terminators,
* but the output normalizes the eol delimiter as the [crlf] argument
* specifies. Note that this implies that
* - If [crlf], the output uses CR/LF as line separator as MIME prescribes
* - the encoding is not invertible for binary data
*)
val encode : ?crlf:bool -> ?pos:int -> ?len:int -> string -> string
(** Encodes the string and returns it.
*
* Since OcamlNet 0.98, soft line breaks are added to the output
* to ensure that all output lines have a length <= 76 bytes.
*
* Note unsafe characters:
* As recommended by RFC 2045, the characters [!#$\@[]^`|{}~]
* and the double quotes
* are additionally represented as hex tokens.
* Furthermore, the letter 'F' is considered as unsafe if it
* occurs at the beginning of the line, so the encoded text
* never contains the word "From" at the beginning of a line.
*
* If [pos] and/or [len] are passed, only the substring starting at
* [pos] (default: 0) with length [len] (default: rest of the string)
* is encoded.
*
* If [crlf] is set (the default), the output text uses CR/LF as
* line separator. Otherwise only LF is used.
*)
val decode : ?pos:int -> ?len:int -> string -> string
(** Decodes the string and returns it.
*
* Most format errors cause an [Invalid_argument] exception.
*
* If [pos] and/or [len] are passed, only the substring starting at
* [pos] (default: 0) with length [len] (default: rest of the string)
* is decoded.
*)
class encoding_pipe : ?crlf:bool -> unit -> Netchannels.pipe
(** This pipe encodes the data written into the pipe. *)
class decoding_pipe : unit -> Netchannels.pipe
(** This pipe decodes the data written into the pipe. *)
end
(* *********************************************************************)
(* Q encoding *)
(* *********************************************************************)
(* See RFC 2047.
* The functions behave similar to those of QuotedPrintable.
*)
(* THREAD-SAFETY:
* All Q functions are reentrant and thus thread-safe.
*)
module Q :
sig
(** The "Q" encoding as described by RFC 2047. *)
val encode : ?pos:int -> ?len:int -> string -> string
(** Note:
* All characters except alphanumeric characters are protected by
* hex tokens.
* In particular, spaces are represented as "=20", not as "_".
*)
val decode : ?pos:int -> ?len:int -> string -> string
end
(* *********************************************************************)
(* B encoding *)
(* *********************************************************************)
(* The B encoding of RFC 2047 is the same as Base64. *)
(* *********************************************************************)
(* URL-encoding *)
(* *********************************************************************)
(* THREAD-SAFETY:
* The Url functions are thread-safe.
*)
module Url :
sig
(** Encoding/Decoding within URLs:
*
* The following two functions perform the '%'-substitution for
* characters that may otherwise be interpreted as metacharacters.
*
* According to: RFC 1738, RFC 1630
*
* Option [plus]: This option has been added because there are some
* implementations that do not map ' ' to '+', for example Javascript's
* [escape] function. The default is [true] because this is the RFC-
* compliant definition.
*)
val decode : ?plus:bool -> ?pos:int -> ?len:int -> string -> string
(** Option [plus]: Whether '+' is converted to space. The default
* is true. If false, '+' is returned as it is.
*
* The optional arguments [pos] and [len] may restrict the string
* to process to this substring.
*)
val encode : ?plus:bool -> string -> string
(** Option [plus]: Whether spaces are converted to '+'. The default
* is true. If false, spaces are converted to "%20", and
* only %xx sequences are produced.
*)
(** URL-encoded parameters:
*
* The following two functions create and analyze URL-encoded parameters.
* Format: [name1=val1&name2=val2&...]
*)
val mk_url_encoded_parameters : (string * string) list -> string
(** The argument is a list of (name,value) pairs. The result is the
* single URL-encoded parameter string.
*)
val dest_url_encoded_parameters : string -> (string * string) list
(** The argument is the URL-encoded parameter string. The result is
* the corresponding list of (name,value) pairs.
* Note: Whitespace within the parameter string is ignored.
* If there is a format error, the function fails.
*)
end
(* *********************************************************************)
(* HTMLization *)
(* *********************************************************************)
(* THREAD-SAFETY:
* The Html functions are thread-safe.
*)
module Html :
sig
(** Encodes characters that need protection by converting them to
* entity references. E.g. ["<"] is converted to ["<"].
* As the entities may be named, there is a dependency on the character
* set.
*)
(* OLD ENCODE/DECODE FUNCTIONS: *)
(** Legacy functions: *)
val encode_from_latin1 : string -> string
(* Encodes the characters 0-8, 11-12, 14-31, '<', '>', '"', '&',
* 127-255. If the characters have a name, a named entity is
* preferred over a numeric entity.
*)
val decode_to_latin1 : string -> string
(* Decodes the string. Unknown named entities are left as they
* are (i.e. decode_to_latin1 "&nonsense;" = "&nonsense;").
* The same applies to numeric entities greater than 255.
*)
(* NEW ENCODE/DECODE FUNCTIONS: *)
(** These functions have a more general interface and should be preferred
* in new programs.
*)
val unsafe_chars_html4 : string
(** The string contains '<', '>', '"', '&' and the control characters
* 0-8, 11-12, 14-31, 127.
*)
val encode : in_enc:Netconversion.encoding ->
?out_enc:Netconversion.encoding -> (* default: `Enc_usascii *)
?prefer_name:bool -> (* default: true *)
?unsafe_chars:string -> (* default: unsafe_chars_html4 *)
unit ->
string ->
string
(** The input string that is encoded as [in_enc] is recoded to
* [out_enc], and the following characters are encoded as HTML
* entity ([&name;] or [&#num;]):
* - The ASCII characters contained in [unsafe_chars]
* - The characters that cannot be represented in [out_enc]. By
* default ([out_enc=`Enc_usascii]), only ASCII characters can be
* represented, and thus all code points >= 128 are encoded as
* HTML entities. If you pass [out_enc=`Enc_utf8], all characters
* can be represented.
*
* For example, the string ["(a<b) & (c>d)"] is encoded as
* ["(a<b) & (c>d)"].
*
* It is required that [out_enc] is an ASCII-compatible encoding.
*
* The option [prefer_name] selects whether named entities (e.g. [<])
* or numeric entities (e.g. [<]) are prefered.
*
* The efficiency of the function can be improved when the same encoding
* is applied to several strings. Create a specialized encoding function
* by passing all arguments up to the unit argument, and apply this
* function several times. For example:
* {[
* let my_enc = encode ~in_enc:`Enc_utf8 () in
* let s1' = my_enc s1 in
* let s2' = my_enc s2 in ...
* ]}
*)
type entity_set = [ `Html | `Xml | `Empty ];;
val decode : in_enc:Netconversion.encoding ->
out_enc:Netconversion.encoding ->
?lookup:(string -> string) -> (* default: see below *)
?subst:(int -> string) -> (* default: see below *)
?entity_base:entity_set -> (* default: `Html *)
unit ->
string ->
string
(** The input string is recoded from [in_enc] to [out_enc], and HTML
* entities ([&name;] or [&#num;]) are resolved. The input encoding
* [in_enc] must be ASCII-compatible.
*
* By default, the function knows all entities defined for HTML 4 (this
* can be changed using [entity_base], see below). If other
* entities occur, the function [lookup] is called and the name of
* the entity is passed as input string to the function. It is
* expected that [lookup] returns the value of the entity, and that this
* value is already encoded as [out_enc].
* By default, [lookup] raises a [Failure] exception.
*
* If a character cannot be represented in the output encoding,
* the function [subst] is called. [subst] must return a substitute
* string for the character.
* By default, [subst] raises a [Failure] exception.
*
* The option [entity_base] determines which set of entities are
* considered as the known entities that can be decoded without
* help by the [lookup] function: [`Html] selects all entities defined
* for HTML 4, [`Xml] selects only [<], [>], [&], ["],
* and ['],
* and [`Empty] selects the empty set (i.e. [lookup] is always called).
*)
end
(* TODO: module with hex routines *)
val to_hex : ?lc:bool -> string -> string
|