ocaml/stdlib/scanf.mli

(***********************************************************************)
(*                                                                     *)
(*                           Objective Caml                            *)
(*                                                                     *)
(*            Pierre Weis, projet Cristal, INRIA Rocquencourt          *)
(*                                                                     *)
(*  Copyright 2002 Institut National de Recherche en Informatique et   *)
(*  en Automatique.  All rights reserved.  This file is distributed    *)
(*  under the terms of the GNU Library General Public License, with    *)
(*  the special exception on linking described in file ../LICENSE.     *)
(*                                                                     *)
(***********************************************************************)

(* $Id$ *)

(** Formatted input functions. *)

(** {6 Scanning buffers} *)
module Scanning : sig

type scanbuf;;
(** The type of scanning buffers. A scanning buffer is the argument passed
   to the scanning functions used by the [scanf] family of functions.
   It holds the current state of the scan, a function to get the next
   character from the input, and a token buffer that stores the string
   matched so far. *)

val from_string : string -> scanbuf;;
(** [Scanning.from_string s] returns a scanning buffer which reads
    from the string [s].
    Reading starts at the first character of the string.
    The end-of-input condition is set when the end of the string is reached. *)

val from_channel : in_channel -> scanbuf;;
(** [Scanning.from_channel inchan] returns a scanning buffer which reads
    from the input channel [inchan], starting at the current reading
    position. *)

val from_function : (unit -> char) -> scanbuf;;
(** [Scanning.from_function f] returns a scanning buffer that uses
    the function [f] as its reading method.
    Each time scanning needs one more character, [f] is called.
    When [f] has no more characters to provide, it must signal the
    end-of-input condition by raising the exception [End_of_file]. *)

end;;

val fscanf : in_channel -> ('a, Scanning.scanbuf, 'b) format -> 'a -> 'b;;
(** [fscanf inchan format f] reads tokens from the channel [inchan] according
   to the format string [format], converts these tokens to values, and
   applies the function [f] to these values.
   The result of this application of [f] is the result of the whole construct.

   The format is a character string which contains three types of
   objects:
   - plain characters, which are simply matched against the characters
   read from the input channel,
   - conversion specifications, each of which causes reading and
   conversion of one argument for [f],
   - scanning indications to specify boundaries of tokens and the
   amount of space to skip between tokens.

   Among plain characters the space character (ASCII code 32) has a
   special meaning: it matches any number of tab, space, newline and
   carriage return characters. Hence, a single space in the format
   matches any amount of whitespace in the input.

   Conversion specifications consist of the [%] character, followed
   by an optional field width, followed by one or two conversion
   characters. The conversion characters and their meanings are:
   - [d]: reads an optionally signed decimal integer.
   - [i]: reads an optionally signed integer
     (usual input formats for hexadecimal ([0x\[d\]+] and [0X\[d\]+]),
      octal ([0o\[d\]+]), and binary ([0b\[d\]+]) notations are understood).
   - [u]: reads an unsigned decimal integer.
   - [x]: reads an unsigned hexadecimal integer with lowercase letters.
   - [X]: reads an unsigned hexadecimal integer with uppercase letters.
   - [o]: reads an unsigned octal integer.
   - [s]: reads a string argument (by default strings end with a space).
   - [S]: reads a delimited string argument (delimiters and special
     escaped characters follow the lexical conventions of Objective Caml).
   - [c]: reads a single character.
   - [C]: reads a single delimited character (delimiters and special
     escaped characters follow the lexical conventions of Objective Caml).
   - [f], [e], [E], [g], [G]: reads an optionally signed floating-point number
     in decimal notation, in the style [dddd.ddd e/E+-dd].
   - [b]: reads a boolean argument ([true] or [false]).
   - [ld], [li], [lu], [lx], [lX], [lo]: reads an [int32] argument in
     the format specified by the second letter (decimal, hexadecimal, etc).
   - [nd], [ni], [nu], [nx], [nX], [no]: reads a [nativeint] argument in
     the format specified by the second letter.
   - [Ld], [Li], [Lu], [Lx], [LX], [Lo]: reads an [int64] argument in
     the format specified by the second letter.
   - [\[ range \]]: reads characters that match one of the characters
     mentioned in the range of characters [range] (or not mentioned in
     it, if the range starts with [^]). Returns a [string] that can be
     empty, if no character in the input matches the range.
   - [N]: applies [f] to the number of characters read so far.
   - [%]: matches one [%] character in the input.

   A field width is an optional integer literal indicating the maximal
   width of the token to read.
   For instance, [%6d] reads an integer having at most 6 decimal digits,
   and [%4f] reads a float with at most 4 characters.

   Scanning indications are introduced by a [@] character, followed
   by some character [c]; the indication matches a plain [c] character
   in the input. If a scanning indication immediately follows an [s]
   conversion specification, it specifies the boundary of the token
   (that is the character immediately after the end of the token). For
   instance, ["%s@\t"] reads the string preceding the next tabulation
   character.

   Note: the [scanf] facility is not intended for heavy duty
   lexing and parsing; if you need efficient language syntactic analysis,
   use the corresponding dedicated libraries. *)

val scanf : ('a, Scanning.scanbuf, 'b) format -> 'a -> 'b;;
(** Same as {!Scanf.fscanf}, but reads its input from [stdin]
    instead of taking an input channel argument. *)

val bscanf :
  Scanning.scanbuf -> ('a, Scanning.scanbuf, 'b) format -> 'a -> 'b;;
(** Same as {!Scanf.fscanf}, but reads its input from the scanning
    buffer given as first argument instead of an input channel. *)

val sscanf : string -> ('a, Scanning.scanbuf, 'b) format -> 'a -> 'b;;
(** Same as {!Scanf.fscanf}, but reads its input from the string
    given as first argument instead of an input channel. *)
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00			`(***********************************************************************)`
			`(* *)`
			`(* Objective Caml *)`
			`(* *)`
			`(* Pierre Weis, projet Cristal, INRIA Rocquencourt *)`
			`(* *)`
			`(* Copyright 2002 Institut National de Recherche en Informatique et *)`
			`(* en Automatique. All rights reserved. This file is distributed *)`
			`(* under the terms of the GNU Library General Public License, with *)`
			`(* the special exception on linking described in file ../LICENSE. *)`
			`(* *)`
			`(***********************************************************************)`

Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4795 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-08 06:51:09 -07:00			`(* $Id$ *)`
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00
			`(** Formatted input functions. *)`

Le module Scanning est intégré dans Scanf. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4849 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-27 15:00:09 -07:00			`(** {6 Scanning buffers} *)`
			`module Scanning : sig`

			`type scanbuf;;`
			`(** The type of scanning buffers. A scanning buffer is the argument passed`
			`to the scanning functions used by the [scanf] family of functions.`
			`The scanning buffer holds the current state of the scan, plus`
			`a function to get the next char from the input, and a token buffer`
			`to store the string matched so far. *)`

			`val from_string : string -> scanbuf;;`
			`(** [Scanning.from_string s] returns a scanning buffer which reads`
			`from the given string.`
			`Reading starts from the first character in the string.`
			`The end-of-input condition is set when the end of the string is reached. *)`

			`val from_channel : in_channel -> scanbuf;;`
			`(** [Scanning.from_channel inchan] returns a scanning buffer which reads`
			`from the input channel [inchan], at the current reading position. *)`

			`val from_function : (unit -> char) -> scanbuf;;`
			`(** [Scanning.from_function f] returns a scanning buffer with`
			`the given function as its reading method.`
			`When scanning needs one more character, the given function is called.`
			`When the function has no more character to provide, it must set`
			`an end of input condition by raising the exception [End_of_file]. *)`

			`end;;`

Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4805 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-12 11:40:15 -07:00			`val fscanf : in_channel -> ('a, Scanning.scanbuf, 'b) format -> 'a -> 'b;;`
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00			`(** [fscanf inchan format f] reads tokens from the channel [inchan] according`
			`to the format string [format], converts these tokens to values, and`
			`applies these values to the function [f].`
			`The result of this application of [f] is the result of the whole construct.`
Typos. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4810 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-15 13:28:57 -07:00
Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4840 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-27 00:05:36 -07:00			`The format is a character string which contains three types of`
			`objects:`
			`- plain characters, which are simply matched with the`
			`input channel,`
			`- conversion specifications, each of which causes reading and`
			`conversion of one argument for [f],`
			`- scanning indications to specify boundaries of tokens and the`
			`amount of space to skip between tokens.`

			`Among plain characters the white space character (ASCII code 32) has a`
			special meaning: it matches a ``space'', that is any number of tab,
			`white space, newline and return. Hence, a space in the format`
			`matches any number of white spaces in the input.`
Typos. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4810 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-15 13:28:57 -07:00
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00			`Conversion specifications consist in the [%] character, followed`
			`by optional field width, followed by one or two conversion`
			`characters. The conversion characters and their meanings are:`
Typos. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4810 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-15 13:28:57 -07:00			`- [d]: reads an optionally signed decimal integer.`
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00			`- [i]: reads an optionally signed integer`
			`(usual input formats for hexadecimal ([0x\[d\]+] and [0X\[d\]+]),`
Typos. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4810 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-15 13:28:57 -07:00			`octal ([0o\[d\]+]), and binary [0b\[d\]+] notations are understood).`
Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4825 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-17 01:17:52 -07:00			`- [u]: reads an unsigned decimal integer.`
			`- [x]: reads an unsigned hexadecimal integer with lowercase letters.`
			`- [X]: reads an unsigned hexadecimal integer with uppercase letters.`
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00			`- [o]: reads an unsigned octal integer.`
Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4840 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-27 00:05:36 -07:00			`- [s]: reads a string argument (by default strings end with a space).`
Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4805 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-12 11:40:15 -07:00			`- [S]: reads a delimited string argument (delimiters and special`
			`escaped characters follow the lexical conventions of Objective Caml).`
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00			`- [c]: reads a single character.`
Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4805 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-12 11:40:15 -07:00			`- [C]: reads a single delimited character (delimiters and special`
			`escaped characters follow the lexical conventions of Objective Caml).`
Les formats [f], [e], [E], [g], [G] sont équivalents. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4848 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-27 13:41:19 -07:00			`- [f], [e], [E], [g], [G]: reads an optionally signed floating-point number`
			`in decimal notation, in the style [dddd.ddd e/E+-dd].`
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00			`- [b]: reads a boolean argument ([true] or [false]).`
Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4795 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-08 06:51:09 -07:00			`- [ld], [li], [lu], [lx], [lX], [lo]: reads an [int32] argument to`
			`the format specified by the second letter (decimal, hexadecimal, etc).`
			`- [nd], [ni], [nu], [nx], [nX], [no]: reads a [nativeint] argument to`
			`the format specified by the second letter.`
			`- [Ld], [Li], [Lu], [Lx], [LX], [Lo]: reads an [int64] argument to`
			`the format specified by the second letter.`
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00			`- [\[ range \]]: reads characters that match one of the characters`
typos git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4829 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-20 12:22:21 -07:00			`mentioned in the range of characters [range] (or not mentioned in`
Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4840 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-27 00:05:36 -07:00			`it, if the range starts by [^]). Returns a [string] that can be`
			`empty, if no character in the input matches the range.`
Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4825 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-17 01:17:52 -07:00			`- [N]: applies [f] to the number of characters read so far.`
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00			`- [%]: matches one [%] character in the input.`

			`The field widths are composed of an optional integer literal`
Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4840 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-27 00:05:36 -07:00			`indicating the maximal width of the token to read.`
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00			`For instance, [%6d] reads an integer, having at most 6 decimal digits;`
			`and [%4f] reads a float with 4 characters.`

Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4840 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-27 00:05:36 -07:00			`Scanning indications are introduced by a [@] character, followed`
			`by any character [c], that matches a plain [c] character in the`
			`input. If a scanning indication immediately follows a [s]`
			`conversion specification, it specifies the boundary of the token`
			`(that is the character immediately after the end of the token). For`
			`instance, ["%s@\t"] reads the string preceding the next tabulation`
			`character.`
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00
			`Note: the [scanf] facility is not intended for heavy duty`
			`lexing and parsing; if you need efficient language syntactic analysis,`
			`use the corresponding devoted libraries. *)`

Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4805 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-12 11:40:15 -07:00			`val scanf : ('a, Scanning.scanbuf, 'b) format -> 'a -> 'b;;`
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00			`(** Same as {!Scanf.fscanf}, but inputs from [stdin]. *)`

			`val bscanf :`
Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4805 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-12 11:40:15 -07:00			`Scanning.scanbuf -> ('a, Scanning.scanbuf, 'b) format -> 'a -> 'b;;`
			`(** Same as {!Scanf.fscanf}, but inputs from the buffer argument. *)`
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00
Documentation. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4805 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-12 11:40:15 -07:00			`val sscanf : string -> ('a, Scanning.scanbuf, 'b) format -> 'a -> 'b;;`
Introducing a ``scanf'' facility in Objective Caml. git-svn-id: http://caml.inria.fr/svn/ocaml/trunk@4780 f963ae5c-01c2-4b8c-9fe0-0dff7051ff02 2002-05-07 00:41:12 -07:00			`(** Same as {!Scanf.fscanf}, but inputs from the string argument. *)`