1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47
|
(* Configurable parameters *)
val database_name : string ref
(** Name of the database file. *)
val html_add_tags : bool ref
(** Whether the names of HTML tags are themselves treated as words. *)
val html_tag_attr : Str.regexp ref
(** Regexp matched against strings of the form [tag/attr], each of which
denotes a pair of an HTML tag name and an attribute name. When such a
pair matches, the associated value is added to the text. *)
val mail_headers : Str.regexp ref
(** Regexp matching the names of the e-mail headers that must be analyzed. *)
val spam_header : string ref
(** Name of the header that is added to carry the spam / not-spam
information. Default: ["X-Spam"]. *)
val attachments_header : string ref
(** Name of the header that is added to carry the attachment summary.
Default: ["X-Attachments"]. *)
val summarize_attachments : bool ref
(** Whether the attachment summary is generated. *)
val num_words_retained : int ref
(** Number of meaningful words retained for computing the final
probability. *)
val max_repetitions : int ref
(** Maximum number of times a given word may appear among the meaningful
words. *)
val low_freq_limit : float ref
(** Lower limit for word frequencies. Default: [0.01]. *)
val high_freq_limit : float ref
(** Upper limit for word frequencies. Default: [0.99]. *)
val min_meaningful_words : int ref
(** Number of meaningful words below which a mail is classified as
unknown. *)
val good_mail_prob : float ref
(** Spam probability below which a mail is classified as good. *)
val spam_mail_prob : float ref
(** Spam probability above which a mail is classified as spam. *)
(* NOTE(review): this comment previously read "below which"; "above" is
   assumed from the contrast with [good_mail_prob], whose threshold is the
   one mails must fall below. Confirm against the classifier code. *)
val options : (string * Configfile.value) list
(** List of the configurable parameters, as pairs of a string and a
[Configfile.value]. *)
(* NOTE(review): the string is presumably the parameter's name as it is
   looked up by [Configfile] — confirm against that module. *)
|