sig
type raw_alignment = {
qname : string;
flag : int;
rname : string;
pos : int;
mapq : int;
cigar : string;
rnext : string;
pnext : int;
tlen : int;
seq : string;
qual : string;
optional : (string * char * string) list;
}
type raw_item =
[ `alignment of Biocaml_sam.raw_alignment
| `comment of string
| `header of string * (string * string) list ]
type reference_sequence = {
ref_name : string;
ref_length : int;
ref_assembly_identifier : string option;
ref_checksum : string option;
ref_species : string option;
ref_uri : string option;
ref_unknown : (string * string) list;
}
val reference_sequence :
?assembly_identifier:string ->
?checksum:string ->
?species:string ->
?uri:string ->
?unknown_data:(string * string) list ->
string -> int -> Biocaml_sam.reference_sequence
module Flags :
sig
type t = private int
val of_int : int -> Biocaml_sam.Flags.t
val has_multiple_segments : Biocaml_sam.Flags.t -> bool
val each_segment_properly_aligned : Biocaml_sam.Flags.t -> bool
val segment_unmapped : Biocaml_sam.Flags.t -> bool
val next_segment_unmapped : Biocaml_sam.Flags.t -> bool
val seq_is_reverse_complemented : Biocaml_sam.Flags.t -> bool
val next_seq_is_reverse_complemented : Biocaml_sam.Flags.t -> bool
val first_segment : Biocaml_sam.Flags.t -> bool
val last_segment : Biocaml_sam.Flags.t -> bool
val secondary_alignment : Biocaml_sam.Flags.t -> bool
val not_passing_quality_controls : Biocaml_sam.Flags.t -> bool
val pcr_or_optical_duplicate : Biocaml_sam.Flags.t -> bool
val t_of_sexp : Sexplib.Sexp.t -> Biocaml_sam.Flags.t
val sexp_of_t : Biocaml_sam.Flags.t -> Sexplib.Sexp.t
end
type cigar_op =
[ `D of int
| `Eq of int
| `H of int
| `I of int
| `M of int
| `N of int
| `P of int
| `S of int
| `X of int ]
type optional_content_value =
[ `array of char * Biocaml_sam.optional_content_value array
| `char of char
| `float of float
| `int of int
| `string of string ]
type optional_content =
(string * char * Biocaml_sam.optional_content_value) list
type alignment = {
query_template_name : string;
flags : Biocaml_sam.Flags.t;
reference_sequence :
[ `name of string
| `none
| `reference_sequence of Biocaml_sam.reference_sequence ];
position : int option;
mapping_quality : int option;
cigar_operations : Biocaml_sam.cigar_op array;
next_reference_sequence :
[ `name of string
| `none
| `qname
| `reference_sequence of Biocaml_sam.reference_sequence ];
next_position : int option;
template_length : int option;
sequence : [ `none | `reference | `string of string ];
quality : Biocaml_phred_score.t array;
optional_content : Biocaml_sam.optional_content;
}
type item =
[ `alignment of Biocaml_sam.alignment
| `comment of string
| `header of string * (string * string) list
| `header_line of
string * [ `coordinate | `queryname | `unknown | `unsorted ] *
(string * string) list
| `reference_sequence_dictionary of
Biocaml_sam.reference_sequence array ]
module Error :
sig
type optional_content_parsing =
[ `wrong_optional of
(string * char * string) list *
[ `not_a_char of string
| `not_a_float of string
| `not_an_int of string
| `unknown_type of char
| `wrong_array of
[ `not_a_char of string
| `not_a_float of string
| `not_an_int of string
| `unknown_type of char
| `wrong_type of string ]
| `wrong_type of string ] ]
type string_to_raw =
[ `incomplete_input of Biocaml_pos.t * string list * string option
| `invalid_header_tag of Biocaml_pos.t * string
| `invalid_tag_value_list of Biocaml_pos.t * string list
| `not_an_int of Biocaml_pos.t * string * string
| `wrong_alignment of Biocaml_pos.t * string
| `wrong_optional_field of Biocaml_pos.t * string ]
type raw_to_item =
[ `comment_after_end_of_header of int * string
| `duplicate_in_reference_sequence_dictionary of
Biocaml_sam.reference_sequence array
| `header_after_end_of_header of
int * (string * (string * string) list)
| `header_line_not_first of int
| `header_line_without_version of (string * string) list
| `header_line_wrong_sorting of string
| `missing_ref_sequence_length of (string * string) list
| `missing_ref_sequence_name of (string * string) list
| `wrong_cigar_text of string
| `wrong_flag of Biocaml_sam.raw_alignment
| `wrong_mapq of Biocaml_sam.raw_alignment
| `wrong_optional of
(string * char * string) list *
[ `not_a_char of string
| `not_a_float of string
| `not_an_int of string
| `unknown_type of char
| `wrong_array of
[ `not_a_char of string
| `not_a_float of string
| `not_an_int of string
| `unknown_type of char
| `wrong_type of string ]
| `wrong_type of string ]
| `wrong_phred_scores of Biocaml_sam.raw_alignment
| `wrong_pnext of Biocaml_sam.raw_alignment
| `wrong_pos of Biocaml_sam.raw_alignment
| `wrong_qname of Biocaml_sam.raw_alignment
| `wrong_ref_sequence_length of (string * string) list
| `wrong_tlen of Biocaml_sam.raw_alignment ]
type item_to_raw = [ `wrong_phred_scores of Biocaml_sam.alignment ]
type parse =
[ `comment_after_end_of_header of int * string
| `duplicate_in_reference_sequence_dictionary of
Biocaml_sam.reference_sequence array
| `header_after_end_of_header of
int * (string * (string * string) list)
| `header_line_not_first of int
| `header_line_without_version of (string * string) list
| `header_line_wrong_sorting of string
| `incomplete_input of Biocaml_pos.t * string list * string option
| `invalid_header_tag of Biocaml_pos.t * string
| `invalid_tag_value_list of Biocaml_pos.t * string list
| `missing_ref_sequence_length of (string * string) list
| `missing_ref_sequence_name of (string * string) list
| `not_an_int of Biocaml_pos.t * string * string
| `wrong_alignment of Biocaml_pos.t * string
| `wrong_cigar_text of string
| `wrong_flag of Biocaml_sam.raw_alignment
| `wrong_mapq of Biocaml_sam.raw_alignment
| `wrong_optional of
(string * char * string) list *
[ `not_a_char of string
| `not_a_float of string
| `not_an_int of string
| `unknown_type of char
| `wrong_array of
[ `not_a_char of string
| `not_a_float of string
| `not_an_int of string
| `unknown_type of char
| `wrong_type of string ]
| `wrong_type of string ]
| `wrong_optional_field of Biocaml_pos.t * string
| `wrong_phred_scores of Biocaml_sam.raw_alignment
| `wrong_pnext of Biocaml_sam.raw_alignment
| `wrong_pos of Biocaml_sam.raw_alignment
| `wrong_qname of Biocaml_sam.raw_alignment
| `wrong_ref_sequence_length of (string * string) list
| `wrong_tlen of Biocaml_sam.raw_alignment ]
val optional_content_parsing_of_sexp :
Sexplib.Sexp.t -> Biocaml_sam.Error.optional_content_parsing
val optional_content_parsing_of_sexp__ :
Sexplib.Sexp.t -> Biocaml_sam.Error.optional_content_parsing
val sexp_of_optional_content_parsing :
Biocaml_sam.Error.optional_content_parsing -> Sexplib.Sexp.t
val string_to_raw_of_sexp :
Sexplib.Sexp.t -> Biocaml_sam.Error.string_to_raw
val string_to_raw_of_sexp__ :
Sexplib.Sexp.t -> Biocaml_sam.Error.string_to_raw
val sexp_of_string_to_raw :
Biocaml_sam.Error.string_to_raw -> Sexplib.Sexp.t
val raw_to_item_of_sexp :
Sexplib.Sexp.t -> Biocaml_sam.Error.raw_to_item
val raw_to_item_of_sexp__ :
Sexplib.Sexp.t -> Biocaml_sam.Error.raw_to_item
val sexp_of_raw_to_item :
Biocaml_sam.Error.raw_to_item -> Sexplib.Sexp.t
val item_to_raw_of_sexp :
Sexplib.Sexp.t -> Biocaml_sam.Error.item_to_raw
val item_to_raw_of_sexp__ :
Sexplib.Sexp.t -> Biocaml_sam.Error.item_to_raw
val sexp_of_item_to_raw :
Biocaml_sam.Error.item_to_raw -> Sexplib.Sexp.t
val parse_of_sexp : Sexplib.Sexp.t -> Biocaml_sam.Error.parse
val parse_of_sexp__ : Sexplib.Sexp.t -> Biocaml_sam.Error.parse
val sexp_of_parse : Biocaml_sam.Error.parse -> Sexplib.Sexp.t
end
val in_channel_to_item_stream :
?buffer_size:int ->
?filename:string ->
Pervasives.in_channel ->
(Biocaml_sam.item, Biocaml_sam.Error.parse) Core.Result.t Stream.t
module Low_level_parsing :
sig
val parse_cigar_text :
string ->
(Biocaml_sam.cigar_op array, [> `wrong_cigar_text of string ])
Core.Result.t
val parse_optional_content :
(string * char * string) list ->
(Biocaml_sam.optional_content,
Biocaml_sam.Error.optional_content_parsing)
Core.Result.t
val parse_header_line :
'a ->
string ->
([> `comment of string | `header of string * (string * string) list ],
[> `invalid_header_tag of 'a * string
| `invalid_tag_value_list of 'a * string list ])
Core.Result.t
val expand_header_line :
(string * string) list ->
([> `header_line of
string * [ `coordinate | `queryname | `unknown | `unsorted ] *
(string * string) list ],
[> `header_line_without_version of (string * string) list
| `header_line_wrong_sorting of string ])
Core.Result.t
end
module Transform :
sig
val string_to_raw :
?filename:string ->
unit ->
(string,
(Biocaml_sam.raw_item, [> Biocaml_sam.Error.string_to_raw ])
Core.Result.t)
Biocaml_transform.t
val raw_to_string :
unit -> (Biocaml_sam.raw_item, string) Biocaml_transform.t
val raw_to_item :
unit ->
(Biocaml_sam.raw_item,
(Biocaml_sam.item, [> Biocaml_sam.Error.raw_to_item ]) Core.Result.t)
Biocaml_transform.t
val item_to_raw :
unit ->
(Biocaml_sam.item,
(Biocaml_sam.raw_item, Biocaml_sam.Error.item_to_raw) Core.Result.t)
Biocaml_transform.t
end
val raw_alignment_of_sexp : Sexplib.Sexp.t -> Biocaml_sam.raw_alignment
val sexp_of_raw_alignment : Biocaml_sam.raw_alignment -> Sexplib.Sexp.t
val raw_item_of_sexp : Sexplib.Sexp.t -> Biocaml_sam.raw_item
val raw_item_of_sexp__ : Sexplib.Sexp.t -> Biocaml_sam.raw_item
val sexp_of_raw_item : Biocaml_sam.raw_item -> Sexplib.Sexp.t
val reference_sequence_of_sexp :
Sexplib.Sexp.t -> Biocaml_sam.reference_sequence
val sexp_of_reference_sequence :
Biocaml_sam.reference_sequence -> Sexplib.Sexp.t
val cigar_op_of_sexp : Sexplib.Sexp.t -> Biocaml_sam.cigar_op
val cigar_op_of_sexp__ : Sexplib.Sexp.t -> Biocaml_sam.cigar_op
val sexp_of_cigar_op : Biocaml_sam.cigar_op -> Sexplib.Sexp.t
val optional_content_value_of_sexp :
Sexplib.Sexp.t -> Biocaml_sam.optional_content_value
val optional_content_value_of_sexp__ :
Sexplib.Sexp.t -> Biocaml_sam.optional_content_value
val sexp_of_optional_content_value :
Biocaml_sam.optional_content_value -> Sexplib.Sexp.t
val optional_content_of_sexp :
Sexplib.Sexp.t -> Biocaml_sam.optional_content
val sexp_of_optional_content :
Biocaml_sam.optional_content -> Sexplib.Sexp.t
val alignment_of_sexp : Sexplib.Sexp.t -> Biocaml_sam.alignment
val sexp_of_alignment : Biocaml_sam.alignment -> Sexplib.Sexp.t
val item_of_sexp : Sexplib.Sexp.t -> Biocaml_sam.item
val item_of_sexp__ : Sexplib.Sexp.t -> Biocaml_sam.item
val sexp_of_item : Biocaml_sam.item -> Sexplib.Sexp.t
end