sig
type raw_alignment =
Biocaml_sam.raw_alignment = {
qname : string;
flag : int;
rname : string;
pos : int;
mapq : int;
cigar : string;
rnext : string;
pnext : int;
tlen : int;
seq : string;
qual : string;
optional : (string * char * string) list;
}
type raw_item =
[ `alignment of raw_alignment
| `comment of string
| `header of string * (string * string) list ]
type reference_sequence =
Biocaml_sam.reference_sequence = {
ref_name : string;
ref_length : int;
ref_assembly_identifier : string option;
ref_checksum : string option;
ref_species : string option;
ref_uri : string option;
ref_unknown : (string * string) list;
}
val reference_sequence :
?assembly_identifier:string ->
?checksum:string ->
?species:string ->
?uri:string ->
?unknown_data:(string * string) list ->
string -> int -> reference_sequence
module Flags :
sig
type t = Biocaml_sam.Flags.t
val of_int : int -> t
val has_multiple_segments : t -> bool
val each_segment_properly_aligned : t -> bool
val segment_unmapped : t -> bool
val next_segment_unmapped : t -> bool
val seq_is_reverse_complemented : t -> bool
val next_seq_is_reverse_complemented : t -> bool
val first_segment : t -> bool
val last_segment : t -> bool
val secondary_alignment : t -> bool
val not_passing_quality_controls : t -> bool
val pcr_or_optical_duplicate : t -> bool
val t_of_sexp : Sexplib.Sexp.t -> t
val sexp_of_t : t -> Sexplib.Sexp.t
end
type cigar_op =
[ `D of int
| `Eq of int
| `H of int
| `I of int
| `M of int
| `N of int
| `P of int
| `S of int
| `X of int ]
type optional_content_value =
[ `array of char * optional_content_value array
| `char of char
| `float of float
| `int of int
| `string of string ]
type optional_content = (string * char * optional_content_value) list
type alignment =
Biocaml_sam.alignment = {
query_template_name : string;
flags : Flags.t;
reference_sequence :
[ `name of string | `none | `reference_sequence of reference_sequence ];
position : int option;
mapping_quality : int option;
cigar_operations : cigar_op array;
next_reference_sequence :
[ `name of string
| `none
| `qname
| `reference_sequence of reference_sequence ];
next_position : int option;
template_length : int option;
sequence : [ `none | `reference | `string of string ];
quality : Biocaml_phred_score.t array;
optional_content : optional_content;
}
type item =
[ `alignment of alignment
| `comment of string
| `header of string * (string * string) list
| `header_line of
string * [ `coordinate | `queryname | `unknown | `unsorted ] *
(string * string) list
| `reference_sequence_dictionary of reference_sequence array ]
module Error :
sig
type optional_content_parsing =
[ `wrong_optional of
(string * char * string) list *
[ `not_a_char of string
| `not_a_float of string
| `not_an_int of string
| `unknown_type of char
| `wrong_array of
[ `not_a_char of string
| `not_a_float of string
| `not_an_int of string
| `unknown_type of char
| `wrong_type of string ]
| `wrong_type of string ] ]
type string_to_raw =
[ `incomplete_input of Biocaml_pos.t * string list * string option
| `invalid_header_tag of Biocaml_pos.t * string
| `invalid_tag_value_list of Biocaml_pos.t * string list
| `not_an_int of Biocaml_pos.t * string * string
| `wrong_alignment of Biocaml_pos.t * string
| `wrong_optional_field of Biocaml_pos.t * string ]
type raw_to_item =
[ `comment_after_end_of_header of int * string
| `duplicate_in_reference_sequence_dictionary of
reference_sequence array
| `header_after_end_of_header of
int * (string * (string * string) list)
| `header_line_not_first of int
| `header_line_without_version of (string * string) list
| `header_line_wrong_sorting of string
| `missing_ref_sequence_length of (string * string) list
| `missing_ref_sequence_name of (string * string) list
| `wrong_cigar_text of string
| `wrong_flag of raw_alignment
| `wrong_mapq of raw_alignment
| `wrong_optional of
(string * char * string) list *
[ `not_a_char of string
| `not_a_float of string
| `not_an_int of string
| `unknown_type of char
| `wrong_array of
[ `not_a_char of string
| `not_a_float of string
| `not_an_int of string
| `unknown_type of char
| `wrong_type of string ]
| `wrong_type of string ]
| `wrong_phred_scores of raw_alignment
| `wrong_pnext of raw_alignment
| `wrong_pos of raw_alignment
| `wrong_qname of raw_alignment
| `wrong_ref_sequence_length of (string * string) list
| `wrong_tlen of raw_alignment ]
type item_to_raw = [ `wrong_phred_scores of alignment ]
type parse =
[ `comment_after_end_of_header of int * string
| `duplicate_in_reference_sequence_dictionary of
reference_sequence array
| `header_after_end_of_header of
int * (string * (string * string) list)
| `header_line_not_first of int
| `header_line_without_version of (string * string) list
| `header_line_wrong_sorting of string
| `incomplete_input of Biocaml_pos.t * string list * string option
| `invalid_header_tag of Biocaml_pos.t * string
| `invalid_tag_value_list of Biocaml_pos.t * string list
| `missing_ref_sequence_length of (string * string) list
| `missing_ref_sequence_name of (string * string) list
| `not_an_int of Biocaml_pos.t * string * string
| `wrong_alignment of Biocaml_pos.t * string
| `wrong_cigar_text of string
| `wrong_flag of raw_alignment
| `wrong_mapq of raw_alignment
| `wrong_optional of
(string * char * string) list *
[ `not_a_char of string
| `not_a_float of string
| `not_an_int of string
| `unknown_type of char
| `wrong_array of
[ `not_a_char of string
| `not_a_float of string
| `not_an_int of string
| `unknown_type of char
| `wrong_type of string ]
| `wrong_type of string ]
| `wrong_optional_field of Biocaml_pos.t * string
| `wrong_phred_scores of raw_alignment
| `wrong_pnext of raw_alignment
| `wrong_pos of raw_alignment
| `wrong_qname of raw_alignment
| `wrong_ref_sequence_length of (string * string) list
| `wrong_tlen of raw_alignment ]
val optional_content_parsing_of_sexp :
Sexplib.Sexp.t -> optional_content_parsing
val optional_content_parsing_of_sexp__ :
Sexplib.Sexp.t -> optional_content_parsing
val sexp_of_optional_content_parsing :
optional_content_parsing -> Sexplib.Sexp.t
val string_to_raw_of_sexp : Sexplib.Sexp.t -> string_to_raw
val string_to_raw_of_sexp__ : Sexplib.Sexp.t -> string_to_raw
val sexp_of_string_to_raw : string_to_raw -> Sexplib.Sexp.t
val raw_to_item_of_sexp : Sexplib.Sexp.t -> raw_to_item
val raw_to_item_of_sexp__ : Sexplib.Sexp.t -> raw_to_item
val sexp_of_raw_to_item : raw_to_item -> Sexplib.Sexp.t
val item_to_raw_of_sexp : Sexplib.Sexp.t -> item_to_raw
val item_to_raw_of_sexp__ : Sexplib.Sexp.t -> item_to_raw
val sexp_of_item_to_raw : item_to_raw -> Sexplib.Sexp.t
val parse_of_sexp : Sexplib.Sexp.t -> parse
val parse_of_sexp__ : Sexplib.Sexp.t -> parse
val sexp_of_parse : parse -> Sexplib.Sexp.t
end
val in_channel_to_item_stream :
?buffer_size:int ->
?filename:string ->
in_channel -> (item, Error.parse) Core.Result.t Stream.t
module Low_level_parsing :
sig
val parse_cigar_text :
string ->
(cigar_op array, [> `wrong_cigar_text of string ]) Core.Result.t
val parse_optional_content :
(string * char * string) list ->
(optional_content, Error.optional_content_parsing) Core.Result.t
val parse_header_line :
'a ->
string ->
([> `comment of string | `header of string * (string * string) list ],
[> `invalid_header_tag of 'a * string
| `invalid_tag_value_list of 'a * string list ])
Core.Result.t
val expand_header_line :
(string * string) list ->
([> `header_line of
string * [ `coordinate | `queryname | `unknown | `unsorted ] *
(string * string) list ],
[> `header_line_without_version of (string * string) list
| `header_line_wrong_sorting of string ])
Core.Result.t
end
module Transform :
sig
val string_to_raw :
?filename:string ->
unit ->
(string, (raw_item, [> Error.string_to_raw ]) Core.Result.t)
Biocaml_transform.t
val raw_to_string : unit -> (raw_item, string) Biocaml_transform.t
val raw_to_item :
unit ->
(raw_item, (item, [> Error.raw_to_item ]) Core.Result.t)
Biocaml_transform.t
val item_to_raw :
unit ->
(item, (raw_item, Error.item_to_raw) Core.Result.t)
Biocaml_transform.t
end
val raw_alignment_of_sexp : Sexplib.Sexp.t -> raw_alignment
val sexp_of_raw_alignment : raw_alignment -> Sexplib.Sexp.t
val raw_item_of_sexp : Sexplib.Sexp.t -> raw_item
val raw_item_of_sexp__ : Sexplib.Sexp.t -> raw_item
val sexp_of_raw_item : raw_item -> Sexplib.Sexp.t
val reference_sequence_of_sexp : Sexplib.Sexp.t -> reference_sequence
val sexp_of_reference_sequence : reference_sequence -> Sexplib.Sexp.t
val cigar_op_of_sexp : Sexplib.Sexp.t -> cigar_op
val cigar_op_of_sexp__ : Sexplib.Sexp.t -> cigar_op
val sexp_of_cigar_op : cigar_op -> Sexplib.Sexp.t
val optional_content_value_of_sexp :
Sexplib.Sexp.t -> optional_content_value
val optional_content_value_of_sexp__ :
Sexplib.Sexp.t -> optional_content_value
val sexp_of_optional_content_value :
optional_content_value -> Sexplib.Sexp.t
val optional_content_of_sexp : Sexplib.Sexp.t -> optional_content
val sexp_of_optional_content : optional_content -> Sexplib.Sexp.t
val alignment_of_sexp : Sexplib.Sexp.t -> alignment
val sexp_of_alignment : alignment -> Sexplib.Sexp.t
val item_of_sexp : Sexplib.Sexp.t -> item
val item_of_sexp__ : Sexplib.Sexp.t -> item
val sexp_of_item : item -> Sexplib.Sexp.t
end