(* Source: /usr/lib/ocaml/sexplib/pre_sexp.ml, as shipped in the package
   libsexplib-camlp4-dev 109.20.00-2 (file owned by root:root, mode 0o644). *)
(* Sexp: Module for handling S-expressions (I/O, etc.) *)
open Format
open Bigarray
include Type
(* Exception carrying an underlying exception together with an S-expression.
   NOTE(review): presumably raised by converters from S-expressions when the
   given S-expression cannot be converted - the raising code is not in this
   part of the file, confirm there. *)
exception Of_sexp_error of exn * t
(* One-dimensional bigarray of characters stored as unsigned 8-bit values
   in C layout. *)
type bigstring = (char, int8_unsigned_elt, c_layout) Array1.t
(* Default indentation level for human-readable conversions *)
let default_indent = ref 1
(* Escaping of strings used as atoms in S-expressions *)
(* [must_escape str] tells whether [str] has to be quoted and escaped when
   printed as an atom.  This is the case when [str] is empty, contains a
   double quote, a parenthesis, a semicolon, a backslash or any character
   not greater than the space character, or contains one of the two
   block-comment delimiters (a hash next to a vertical bar, in either
   order). *)
let must_escape str =
  (* Characters that on their own force quoting. *)
  let forbidden = function
    | '"' | '(' | ')' | ';' | '\\' -> true
    | c -> c <= ' '
  in
  (* Two adjacent characters forming a block-comment delimiter. *)
  let comment_pair before here =
    (before = '#' && here = '|') || (before = '|' && here = '#')
  in
  (* Scan from index [ix] down to the start of the string. *)
  let rec scan ix =
    ix >= 0
    && (forbidden str.[ix]
        || (ix > 0 && comment_pair str.[ix - 1] str.[ix])
        || scan (ix - 1))
  in
  let len = String.length str in
  len = 0 || scan (len - 1)
(* [maybe_esc_str str] returns [str] itself (physically the same value) when
   it can be printed verbatim as an atom; otherwise it returns a freshly
   allocated string holding the escaped contents of [str] between double
   quotes.  Callers rely on physical equality with the argument to detect
   that no quoting took place. *)
let maybe_esc_str str =
  if not (must_escape str) then str
  else String.concat "" ["\""; String.escaped str; "\""]
(* Print [str] on formatter [ppf], quoted and escaped if necessary. *)
let pp_maybe_esc_str ppf str =
  let printable = maybe_esc_str str in
  pp_print_string ppf printable
(* Output of S-expressions to formatters *)
(* [pp_hum_indent indent ppf sexp] prints [sexp] on [ppf] in human-readable
   form.  Every non-empty list opens a pretty-printing box with offset
   [indent]; its elements are separated by break hints. *)
let rec pp_hum_indent indent ppf = function
  | Atom str -> pp_maybe_esc_str ppf str
  | List [] -> pp_print_string ppf "()"
  | List (first :: rest) ->
    pp_open_box ppf indent;
    pp_print_string ppf "(";
    pp_hum_indent indent ppf first;
    pp_hum_rest indent ppf rest

(* [pp_hum_rest indent ppf elems] prints the remaining elements of a list
   whose first element has already been printed, then the closing
   parenthesis, and finally closes the box opened by [pp_hum_indent]. *)
and pp_hum_rest indent ppf elems =
  let print_elem elem =
    pp_print_space ppf ();
    pp_hum_indent indent ppf elem
  in
  List.iter print_elem elems;
  pp_print_string ppf ")";
  pp_close_box ppf ()
(* [pp_mach_internal may_need_space ppf sexp] prints [sexp] on [ppf] in
   compact machine-readable form.  [may_need_space] tells whether the
   previously printed item was an unquoted atom; a separating space is only
   emitted between two unquoted atoms.  The result tells whether the item
   just printed was an unquoted atom. *)
let rec pp_mach_internal may_need_space ppf sexp =
  match sexp with
  | List [] ->
    pp_print_string ppf "()";
    false
  | List (first :: rest) ->
    pp_print_string ppf "(";
    let after_first = pp_mach_internal false ppf first in
    pp_mach_rest after_first ppf rest;
    false
  | Atom str ->
    let printed = maybe_esc_str str in
    (* Physical equality: the atom was returned untouched, i.e. unquoted. *)
    let is_bare = printed == str in
    if may_need_space && is_bare then pp_print_string ppf " ";
    pp_print_string ppf printed;
    is_bare

(* Print the remaining elements of a list, threading the spacing flag from
   one element to the next, then print the closing parenthesis. *)
and pp_mach_rest may_need_space ppf elems =
  let step need_space elem = pp_mach_internal need_space ppf elem in
  ignore (List.fold_left step may_need_space elems);
  pp_print_string ppf ")"
(* Human-readable printer; reads the current contents of [default_indent]
   on every call. *)
let pp_hum ppf sexp = pp_hum_indent !default_indent ppf sexp
(* Machine-readable printer; the spacing flag returned by
   [pp_mach_internal] is discarded. *)
let pp_mach ppf sexp = ignore (pp_mach_internal false ppf sexp)
(* Default printer: same function as [pp_mach]. *)
let pp = pp_mach
(* Sexp size *)
(* [size_loop (atoms, chars) sexp] adds to the accumulator the number of
   atoms found in [sexp] and the total length of their strings. *)
let rec size_loop acc sexp =
  match sexp with
  | List elems -> List.fold_left size_loop acc elems
  | Atom str ->
    let atoms, chars = acc in
    (atoms + 1, chars + String.length str)

(* [size sexp] returns the pair (number of atoms, total number of atom
   characters) of [sexp]. *)
let size sexp = size_loop (0, 0) sexp
(* Buffer conversions *)
(* [to_buffer_hum ~buf ?indent sexp] appends the human-readable rendering of
   [sexp] to [buf].  [indent] defaults to the current contents of
   [default_indent].  A formatter writing into [buf] is created for the call
   and flushed before returning. *)
let to_buffer_hum ~buf ?(indent = !default_indent) sexp =
  let ppf = Format.formatter_of_buffer buf in
  pp_hum_indent indent ppf sexp;
  Format.pp_print_flush ppf ()
(* [to_buffer_mach ~buf sexp] appends the compact machine-readable rendering
   of [sexp] to [buf].  A space is inserted only between two consecutive
   atoms that were both printed without quotes. *)
let to_buffer_mach ~buf sexp =
  (* [emit need_space sexp] writes [sexp]; the result tells whether it was
     an unquoted atom, which is what the next sibling needs to know. *)
  let rec emit need_space = function
    | List [] ->
      Buffer.add_string buf "()";
      false
    | List (first :: rest) ->
      Buffer.add_char buf '(';
      let after_first = emit false first in
      ignore (List.fold_left emit after_first rest);
      Buffer.add_char buf ')';
      false
    | Atom str ->
      let printed = maybe_esc_str str in
      (* Physical equality: the atom did not need quoting. *)
      let is_bare = printed == str in
      if need_space && is_bare then Buffer.add_char buf ' ';
      Buffer.add_string buf printed;
      is_bare
  in
  ignore (emit false sexp)

(* Default buffer conversion: same function as [to_buffer_mach]. *)
let to_buffer = to_buffer_mach
(* [to_buffer_gen ~buf ~add_char ~add_string sexp] writes the compact
   machine-readable rendering of [sexp] to an arbitrary sink [buf], using
   [add_char] and [add_string] as the only output primitives.  The layout
   is the same as the one produced by [to_buffer_mach]. *)
let to_buffer_gen ~buf ~add_char ~add_string sexp =
  (* [emit need_space sexp] writes [sexp]; the result tells whether it was
     an unquoted atom. *)
  let rec emit need_space = function
    | List [] ->
      add_string buf "()";
      false
    | List (first :: rest) ->
      add_char buf '(';
      let after_first = emit false first in
      ignore (List.fold_left emit after_first rest);
      add_char buf ')';
      false
    | Atom str ->
      let printed = maybe_esc_str str in
      (* Physical equality: the atom did not need quoting. *)
      let is_bare = printed == str in
      if need_space && is_bare then add_char buf ' ';
      add_string buf printed;
      is_bare
  in
  ignore (emit false sexp)
(* Output of S-expressions to I/O-channels *)
(* The maximum size of a thing on the minor heap is 256 words.
Previously, this size of the returned buffer here was 4096 bytes, which
caused the Buffer to be allocated on the *major* heap every time.
According to a simple benchmark by Ron, we can improve performance for
small s-expressions by a factor of ~4 if we only allocate 1024 bytes
(128 words + some small overhead) worth of buffer initially. And one
can argue that if it's free to allocate strings smaller than 256 words,
large s-expressions requiring larger expensive buffers won't notice
the extra two doublings from 1024 bytes to 2048 and 4096. And especially
performance-sensitive applications can always pass in a larger buffer to
use. *)
(* Fresh output buffer with an initial capacity of 1024 bytes. *)
let buffer () = Buffer.create 1024

(* [with_new_buffer oc f] lets [f] fill a fresh buffer and then writes the
   buffer contents to channel [oc]. *)
let with_new_buffer oc f =
  let scratch = buffer () in
  f scratch;
  Buffer.output_buffer oc scratch

(* Write [sexp] to [oc] in human-readable form with default indentation. *)
let output_hum oc sexp =
  let fill buf = to_buffer_hum ~buf sexp in
  with_new_buffer oc fill

(* Write [sexp] to [oc] in human-readable form with the given [indent]. *)
let output_hum_indent indent oc sexp =
  let fill buf = to_buffer_hum ~buf ~indent sexp in
  with_new_buffer oc fill

(* Write [sexp] to [oc] in machine-readable form. *)
let output_mach oc sexp =
  let fill buf = to_buffer_mach ~buf sexp in
  with_new_buffer oc fill

(* Default channel output: same function as [output_mach]. *)
let output = output_mach
(* Output of S-expressions to file *)
(* The temp file functions in the OCaml Filename module do not support
permissions. But opening a file with given permissions is different
from opening it and chmoding it to these permissions, because the umask
is taken into account. Under Unix there's no easy way to get the umask in
a thread-safe way. *)
(* Creation of temporary files with caller-chosen permissions. *)
module Tmp_file = struct
  (* Random state used for generating names; created on first use. *)
  let prng = ref None

  (* [temp_file_name prefix suffix] returns [prefix], followed by six
     hexadecimal digits drawn at random, followed by [suffix]. *)
  let temp_file_name prefix suffix =
    let state =
      match !prng with
      | None ->
        let fresh = Random.State.make_self_init () in
        prng := Some fresh;
        fresh
      | Some existing -> existing
    in
    let rnd = Random.State.bits state land 0xFFFFFF in
    prefix ^ Printf.sprintf "%06x" rnd ^ suffix

  (* Keep the permissions loose. Sexps are usually shared and rarely private*)
  (* [open_temp_file ?perm prefix suffix] creates a new file exclusively and
     opens it for writing in text mode; returns its name and the channel.
     A [Sys_error] while opening triggers a retry with another random name;
     the error is re-raised once 1000 retries have already failed. *)
  let open_temp_file ?(perm = 0o666) prefix suffix =
    let flags = [Open_wronly; Open_creat; Open_excl; Open_text] in
    let rec attempt failures =
      let name = temp_file_name prefix suffix in
      let opened =
        try Some (open_out_gen flags perm name)
        with Sys_error _ as e ->
          if failures >= 1000 then raise e else None
      in
      match opened with
      | Some oc -> name, oc
      | None -> attempt (failures + 1)
    in
    attempt 0
end
(* [save_of_output ?perm output_function file sexp] writes [sexp] to [file]
   atomically: the data is first written with [output_function] to a
   temporary file whose name starts with [file], which is then renamed to
   [file].

   On any failure (while writing, closing or renaming) the temporary file
   is removed on a best-effort basis and the original exception is
   re-raised, so that no temporary file is left behind.

   @param perm permissions used when creating the temporary file
   @raise Sys_error if the temporary file cannot be created or renamed;
   any exception raised by [output_function] is propagated unchanged. *)
let save_of_output ?perm output_function file sexp =
  let tmp_name, oc = Tmp_file.open_temp_file ?perm file "tmp" in
  (* Best-effort cleanup: only file-system errors are ignored here. *)
  let remove_tmp () = try Sys.remove tmp_name with Sys_error _ -> () in
  begin
    try
      output_function oc sexp;
      close_out oc
    with e ->
      close_out_noerr oc;
      remove_tmp ();
      raise e
  end;
  (* A failed rename must not leak the temporary file either. *)
  try Sys.rename tmp_name file
  with e ->
    remove_tmp ();
    raise e
(* Write one S-expression with [do_output], followed by a newline. *)
let output_sexp_nl do_output oc sexp =
  do_output oc sexp;
  output_char oc '\n'

(* Save [sexp] to [file] in human-readable form, followed by a newline. *)
let save_hum ?perm file sexp =
  let write oc sexp = output_sexp_nl output_hum oc sexp in
  save_of_output ?perm write file sexp

(* Save [sexp] to [file] in machine-readable form (no trailing newline). *)
let save_mach ?perm file sexp = save_of_output ?perm output_mach file sexp

(* Default save function: same function as [save_mach]. *)
let save = save_mach

(* Write each S-expression of [sexps] with [do_output], one per line. *)
let output_sexps_nl do_output oc sexps =
  List.iter (fun sexp -> output_sexp_nl do_output oc sexp) sexps

(* Save a list of S-expressions to [file], human-readable, one per line. *)
let save_sexps_hum ?perm file sexps =
  let write oc sexps = output_sexps_nl output_hum oc sexps in
  save_of_output ?perm write file sexps

(* Save a list of S-expressions to [file], machine-readable, one per line. *)
let save_sexps_mach ?perm file sexps =
  let write oc sexps = output_sexps_nl output_mach oc sexps in
  save_of_output ?perm write file sexps

(* Default list save function: same function as [save_sexps_mach]. *)
let save_sexps = save_sexps_mach
(* String conversions *)
(* [to_string_hum ?indent sexp] renders [sexp] as a human-readable string.
   Atoms are converted directly without going through a buffer. *)
let to_string_hum ?indent sexp =
  match sexp with
  | Atom str -> maybe_esc_str str
  | List _ ->
    let buf = buffer () in
    to_buffer_hum ~buf ?indent sexp;
    Buffer.contents buf

(* [to_string_mach sexp] renders [sexp] as a compact machine-readable
   string.  Atoms are converted directly without going through a buffer. *)
let to_string_mach sexp =
  match sexp with
  | Atom str -> maybe_esc_str str
  | List _ ->
    let buf = buffer () in
    to_buffer_mach ~buf sexp;
    Buffer.contents buf

(* Default string conversion: same function as [to_string_mach]. *)
let to_string = to_string_mach
(* Scan functions *)
(* Each scan function runs one entry point of [Parser] over [lexbuf], using
   the lexer [Lexer.main] with the optional scratch buffer [buf]. *)

(* Entry point [Parser.sexp]. *)
let scan_sexp ?buf lexbuf =
  let lexer = Lexer.main ?buf in
  Parser.sexp lexer lexbuf

(* Entry point [Parser.sexp_opt]. *)
let scan_sexp_opt ?buf lexbuf =
  let lexer = Lexer.main ?buf in
  Parser.sexp_opt lexer lexbuf

(* Entry point [Parser.sexps]. *)
let scan_sexps ?buf lexbuf =
  let lexer = Lexer.main ?buf in
  Parser.sexps lexer lexbuf

(* Entry point [Parser.rev_sexps]. *)
let scan_rev_sexps ?buf lexbuf =
  let lexer = Lexer.main ?buf in
  Parser.rev_sexps lexer lexbuf
(* [get_main_buf buf] returns the lexer [Lexer.main] bound to the given
   scratch buffer, or to a fresh 128-byte buffer when [buf] is [None]. *)
let get_main_buf buf =
  match buf with
  | Some buf -> Lexer.main ~buf
  | None -> Lexer.main ~buf:(Buffer.create 128)
(* [scan_fold_sexps ?buf ~f ~init lexbuf] reads S-expressions from [lexbuf]
   one at a time until [Parser.sexp_opt] returns [None], folding [f] over
   them from left to right starting with [init]. *)
let scan_fold_sexps ?buf ~f ~init lexbuf =
  let main = get_main_buf buf in
  let acc = ref init in
  let running = ref true in
  while !running do
    match Parser.sexp_opt main lexbuf with
    | None -> running := false
    | Some sexp -> acc := f !acc sexp
  done;
  !acc
(* [scan_iter_sexps ?buf ~f lexbuf] applies [f] to every S-expression read
   from [lexbuf], in input order. *)
let scan_iter_sexps ?buf ~f lexbuf =
  let apply () sexp = f sexp in
  scan_fold_sexps ?buf ~f:apply ~init:() lexbuf

(* [scan_sexps_conv ?buf ~f lexbuf] returns the list of the results of [f]
   on every S-expression read from [lexbuf], in input order. *)
let scan_sexps_conv ?buf ~f lexbuf =
  let rev_converted =
    scan_fold_sexps ?buf ~f:(fun acc sexp -> f sexp :: acc) ~init:[] lexbuf
  in
  List.rev rev_converted
(* Partial parsing *)
(* S-expressions annotated with the source range they were parsed from. *)
module Annot = struct
  (* A position in the input: line, column and character offset. *)
  type pos = { line : int; col : int; offset : int }

  (* Start and end position of a parsed S-expression. *)
  type range = { start_pos : pos; end_pos : pos }

  (* Annotated S-expression.  Every node carries its range and the plain
     S-expression it corresponds to; lists also carry their annotated
     elements. *)
  type t = Atom of range * Type.t | List of range * t list * Type.t

  (* Result of a conversion: a value, or an exception together with the
     annotated S-expression it is associated with. *)
  type 'a conv = [ `Result of 'a | `Error of exn * t ]

  exception Conv_exn of string * exn

  (* Parser stack for annotated parsing: recorded start positions and the
     stack of partially built lists. *)
  type stack = {
    mutable positions : pos list;
    mutable stack : t list list;
  }

  (* Plain S-expression stored in an annotated node. *)
  let get_sexp annot =
    match annot with
    | Atom (_, sexp) -> sexp
    | List (_, _, sexp) -> sexp

  (* Source range stored in an annotated node. *)
  let get_range annot =
    match annot with
    | Atom (range, _) -> range
    | List (range, _, _) -> range

  (* Not raised by the functions of this module; kept as part of the module
     contents for code that refers to it. *)
  exception Annot_sexp of t

  (* [find_sexp annot_sexp sexp] returns the first node of [annot_sexp], in
     depth-first pre-order, whose plain S-expression is physically equal to
     [sexp], or [None] if there is no such node. *)
  let find_sexp annot_sexp sexp =
    let rec search node =
      if get_sexp node == sexp then Some node
      else
        match node with
        | Atom _ -> None
        | List (_, children, _) -> search_children children
    and search_children = function
      | [] -> None
      | child :: rest ->
        (match search child with
         | Some _ as found -> found
         | None -> search_children rest)
    in
    search annot_sexp
end
(* Mutable record tracking how far a parser has advanced. *)
module Parse_pos = struct
  type t =
    {
      mutable text_line : int;      (* line number, at least 1 *)
      mutable text_char : int;      (* character position within the line *)
      mutable global_offset : int;  (* offset over all input seen so far *)
      mutable buf_pos : int;        (* index into the current buffer *)
    }

  (* [create ?text_line ?text_char ?buf_pos ?global_offset ()] builds a new
     position.  Defaults: line 1, all other fields 0.
     @raise Failure if [text_line < 1] or any other field is negative; the
     checks are made in the order text_line, text_char, global_offset,
     buf_pos. *)
  let create
      ?(text_line = 1) ?(text_char = 0)
      ?(buf_pos = 0) ?(global_offset = 0) () =
    let check violated msg =
      if violated then failwith ("Sexplib.Sexp.Parse_pos.create: " ^ msg)
    in
    check (text_line < 1) "text_line < 1";
    check (text_char < 0) "text_char < 0";
    check (global_offset < 0) "global_offset < 0";
    check (buf_pos < 0) "buf_pos < 0";
    { text_line; text_char; global_offset; buf_pos }

  (* [with_buf_pos t buf_pos] returns a copy of [t] whose [buf_pos] field is
     [buf_pos]; [t] itself is left unchanged. *)
  let with_buf_pos t buf_pos = { t with buf_pos = buf_pos }
end
(* Kind of construct a parser was in the middle of when it ran out of
   input. *)
module Cont_state = struct
  type t =
    | Parsing_whitespace
    | Parsing_atom
    | Parsing_list
    | Parsing_sexp_comment
    | Parsing_block_comment

  (* [to_string state] returns the constructor name of [state]. *)
  let to_string state =
    match state with
    | Parsing_block_comment -> "Parsing_block_comment"
    | Parsing_sexp_comment -> "Parsing_sexp_comment"
    | Parsing_list -> "Parsing_list"
    | Parsing_atom -> "Parsing_atom"
    | Parsing_whitespace -> "Parsing_whitespace"
end
(* Result of running a resumable parser over a piece of input of type 'a:
   either a finished value of type 't together with the position reached,
   or a request for more input, carrying the kind of construct being parsed
   and the function to call with the next piece of input. *)
type ('a, 't) parse_result =
| Done of 't * Parse_pos.t
| Cont of Cont_state.t * ('a, 't) parse_fun
(* Resumption function: parses [len] characters of the given input,
   starting at index [pos]. *)
and ('a, 't) parse_fun = pos : int -> len : int -> 'a -> ('a, 't) parse_result
(* Internal state of a running parser: current position, the stack of
   partially built values, and the buffer collecting the characters of the
   atom being read. *)
type 't parse_state =
{
parse_pos : Parse_pos.t;
mutable pstack : 't;
pbuf : Buffer.t;
}
(* Payload of [Parse_error]: the name of the parser function that detected
   the problem, a message, and the parser state at that point (tagged by
   the kind of parser: plain or annotated). *)
type parse_error =
{
location : string;
err_msg : string;
parse_state :
[
| `Sexp of t list list parse_state
| `Annot of Annot.stack parse_state
]
}
(* Raised by the parsers on malformed input. *)
exception Parse_error of parse_error
(* Move the text position to the beginning of the next line. *)
let bump_text_line { parse_pos = p; _ } =
  p.Parse_pos.text_char <- 0;
  p.Parse_pos.text_line <- p.Parse_pos.text_line + 1

(* Move the text position one character forward on the current line. *)
let bump_text_pos { parse_pos = p; _ } =
  p.Parse_pos.text_char <- succ p.Parse_pos.text_char
(* Continuation-passing helpers used by the generated parsers.  Each of
   them updates the text position stored in [state] and then resumes
   parsing by calling [cont] on the next buffer index [pos + 1]. *)

(* Consume one character on the current line, then continue with [cont]. *)
let bump_pos_cont state str ~max_pos ~pos cont =
bump_text_pos state;
cont state str ~max_pos ~pos:(pos + 1)
(* Consume a line break, then continue with [cont]. *)
let bump_line_cont state str ~max_pos ~pos cont =
bump_text_line state;
cont state str ~max_pos ~pos:(pos + 1)
(* Append character [c] to the atom buffer, update the text position with
   [bump], then continue with [cont]. *)
let add_bump bump state str ~max_pos ~pos c cont =
Buffer.add_char state.pbuf c;
bump state;
cont state str ~max_pos ~pos:(pos + 1)
(* [add_bump] for a character that stays on the current line. *)
let add_bump_pos state str ~max_pos ~pos c cont =
add_bump bump_text_pos state str ~max_pos ~pos c cont
(* [add_bump] for a character that starts a new line. *)
let add_bump_line state str ~max_pos ~pos c cont =
add_bump bump_text_line state str ~max_pos ~pos c cont
(* [set_parse_pos parse_pos buf_pos] moves the buffer position to [buf_pos]
   and advances the global offset by the same distance. *)
let set_parse_pos parse_pos buf_pos =
  let advanced = buf_pos - parse_pos.Parse_pos.buf_pos in
  parse_pos.Parse_pos.global_offset <-
    parse_pos.Parse_pos.global_offset + advanced;
  parse_pos.Parse_pos.buf_pos <- buf_pos

(* [mk_parse_pos state buf_pos] updates the position stored in [state] to
   [buf_pos] and returns that (shared, mutable) position record. *)
let mk_parse_pos state buf_pos =
  let { parse_pos; _ } = state in
  set_parse_pos parse_pos buf_pos;
  parse_pos

(* [raise_parse_error parse_state location buf_pos err_msg] records
   [buf_pos] in the position of [parse_state] and raises [Parse_error]. *)
let raise_parse_error parse_state location buf_pos err_msg =
  let parse_pos =
    match parse_state with
    | `Sexp { parse_pos; _ } | `Annot { parse_pos; _ } -> parse_pos
  in
  set_parse_pos parse_pos buf_pos;
  raise (Parse_error { location; err_msg; parse_state })

(* Raise [Parse_error] reporting the unexpected character [c]. *)
let raise_unexpected_char parse_state location buf_pos c =
  raise_parse_error parse_state location buf_pos
    (sprintf "unexpected character: '%c'" c)
(* Adapts a public continuation [cont_parse] (called with ~pos and ~len) to
   the internal calling convention (state, input, ~max_pos, ~pos).  The
   state argument is ignored and the length is recomputed as
   [max_pos - pos + 1].
   NOTE(review): the leading [();] presumably keeps the compiler from
   merging the outer and inner parameters into one multi-argument function,
   so that applying this to [cont_parse] alone directly yields a closure -
   confirm before touching it. *)
let mk_cont_parser cont_parse = (); fun _state str ~max_pos ~pos ->
let len = max_pos - pos + 1 in
cont_parse ~pos ~len str
(* Macro for generating parsers.

   The expansion defines a family of mutually recursive, resumable state
   functions and, at the end, a public entry point that shadows the main
   state function.  Macro parameters:

   - TYPE: type of the input buffer (used to annotate check_str_bounds).
   - GET_LEN: function returning the length of a value of that type.
   - PARSE: name of the main state function and of the public entry point.
   - GET_CHAR: expression reading the character at [pos] in [str].
   - GET_PSTACK: expression reading the stack of partially built lists
     from [state].
   - SET_PSTACK: statement storing the local variable [pstack] back into
     [state].
   - REGISTER_POS, REGISTER_POS1: statements (possibly empty) spliced in
     where an S-expression starts; REGISTER_POS1 is the variant used at an
     opening double quote.
   - MK_ATOM: expression building an atom from the local [pbuf_str].
   - MK_LIST: expression building a list from the local [sexp_lst].
   - INIT_PSTACK: initial value of the [pstack] field.
   - MK_PARSE_STATE: constructor wrapping [state] for error reporting.

   When the input runs out ([pos > max_pos]) the current state function is
   wrapped into a [Cont] result so that parsing can resume with more input;
   every such continuation may be called only once.  [Done] is returned as
   soon as one complete top-level S-expression has been read. *)
#define MK_PARSER( \
TYPE, GET_LEN, PARSE, GET_CHAR, \
GET_PSTACK, SET_PSTACK, \
REGISTER_POS, REGISTER_POS1, \
MK_ATOM, MK_LIST, INIT_PSTACK, MK_PARSE_STATE) \
let bump_found_atom bump state str ~max_pos ~pos cont = \
let pbuf = state.pbuf in \
let pbuf_str = Buffer.contents pbuf in \
let atom = MK_ATOM in \
match GET_PSTACK with \
| [] -> Done (atom, mk_parse_pos state pos) \
| rev_sexp_lst :: sexp_stack -> \
Buffer.clear pbuf; \
let pstack = (atom :: rev_sexp_lst) :: sexp_stack in \
SET_PSTACK; \
bump state; \
cont state str ~max_pos ~pos:(pos + 1) \
\
let check_str_bounds loc ~pos ~len (str : TYPE) = \
if pos < 0 then invalid_arg (loc ^ ": pos < 0"); \
if len < 0 then invalid_arg (loc ^ ": len < 0"); \
let str_len = GET_LEN str in \
let pos_len = pos + len in \
if pos_len > str_len then invalid_arg (loc ^ ": pos + len > str_len"); \
pos_len - 1 \
\
let mk_cont_state name cont state ~cont_state = \
let parse_fun = \
let used_ref = ref false in \
fun ~pos ~len str -> \
if !used_ref then \
failwith "Sexplib.Sexp: parser continuation called twice" \
else begin \
used_ref := true; \
let max_pos = check_str_bounds name ~pos ~len str in \
cont state str ~max_pos ~pos \
end \
in \
Cont (cont_state, parse_fun) \
\
let mk_cont name cont state = \
let cont_state = \
match GET_PSTACK = [], Buffer.length state.pbuf = 0 with \
| true, true -> Cont_state.Parsing_whitespace \
| false, true -> Cont_state.Parsing_list \
| _, false -> Cont_state.Parsing_atom \
in \
mk_cont_state name cont state ~cont_state \
\
let rec PARSE state str ~max_pos ~pos = \
if pos > max_pos then mk_cont "parse" PARSE state \
else \
match GET_CHAR with \
| '(' -> \
REGISTER_POS \
let pstack = [] :: GET_PSTACK in \
SET_PSTACK; \
bump_pos_cont state str ~max_pos ~pos PARSE \
| ')' as c -> \
(match GET_PSTACK with \
| [] -> raise_unexpected_char (MK_PARSE_STATE state) "parse" pos c \
| rev_sexp_lst :: sexp_stack -> \
let sexp_lst = List.rev rev_sexp_lst in \
let sexp = MK_LIST in \
match sexp_stack with \
| [] -> Done (sexp, mk_parse_pos state (pos + 1)) \
| higher_rev_sexp_lst :: higher_sexp_stack -> \
let pstack = \
(sexp :: higher_rev_sexp_lst) :: higher_sexp_stack \
in \
SET_PSTACK; \
bump_pos_cont state str ~max_pos ~pos PARSE) \
| ' ' | '\009' | '\012' -> bump_pos_cont state str ~max_pos ~pos PARSE \
| '\010' -> bump_line_cont state str ~max_pos ~pos PARSE \
| '\013' -> bump_pos_cont state str ~max_pos ~pos parse_nl \
| ';' -> bump_pos_cont state str ~max_pos ~pos parse_comment \
| '"' -> \
REGISTER_POS1 \
bump_pos_cont state str ~max_pos ~pos parse_quoted \
| c -> \
REGISTER_POS \
let parse = \
match c with \
| '#' -> maybe_parse_comment \
| '|' -> maybe_parse_close_comment \
| _ -> parse_atom \
in \
add_bump_pos state str ~max_pos ~pos c parse \
\
and parse_nl state str ~max_pos ~pos = \
if pos > max_pos then mk_cont "parse_nl" parse_nl state \
else \
let c = GET_CHAR in \
if c = '\010' then bump_line_cont state str ~max_pos ~pos PARSE \
else raise_unexpected_char (MK_PARSE_STATE state) "parse_nl" pos c \
\
and parse_comment state str ~max_pos ~pos = \
if pos > max_pos then mk_cont "parse_comment" parse_comment state \
else \
match GET_CHAR with \
| '\010' -> bump_line_cont state str ~max_pos ~pos PARSE \
| '\013' -> bump_pos_cont state str ~max_pos ~pos parse_nl \
| _ -> bump_pos_cont state str ~max_pos ~pos parse_comment \
\
and maybe_parse_comment state str ~max_pos ~pos = \
if pos > max_pos then \
mk_cont "maybe_parse_comment" maybe_parse_comment state \
else \
match GET_CHAR with \
| ';' -> bump_pos_cont state str ~max_pos ~pos parse_sexp_comment \
| '|' -> bump_pos_cont state str ~max_pos ~pos parse_block_comment \
| _ -> parse_atom state str ~max_pos ~pos \
\
and maybe_parse_close_comment state str ~max_pos ~pos = \
if pos > max_pos then \
mk_cont "maybe_parse_close_comment" maybe_parse_close_comment state \
else \
if GET_CHAR <> '#' then parse_atom state str ~max_pos ~pos \
else \
let err_msg = "end of block comment without start" in \
raise_parse_error (MK_PARSE_STATE state) \
"maybe_parse_close_comment" pos err_msg \
\
and parse_sexp_comment state str ~max_pos ~pos = \
let pbuf_str = "" in \
ignore (MK_ATOM); \
Buffer.clear state.pbuf; \
let old_pstack = GET_PSTACK in \
let pstack = [] in \
SET_PSTACK; \
let rec loop parse state str ~max_pos ~pos = \
match parse state str ~max_pos ~pos with \
| Done (_sexp, { Parse_pos.buf_pos = pos; _ }) -> \
Buffer.clear state.pbuf; \
let pstack = old_pstack in \
SET_PSTACK; \
PARSE state str ~max_pos ~pos \
| Cont (_, cont_parse) -> \
Buffer.clear state.pbuf; \
let parse = mk_cont_parser cont_parse in \
mk_cont_state "parse_sexp_comment" (loop parse) state \
~cont_state:Cont_state.Parsing_sexp_comment \
in \
loop PARSE state str ~max_pos ~pos \
\
and parse_block_comment state str ~max_pos ~pos = \
let pbuf_str = "" in \
ignore (MK_ATOM); \
Buffer.clear state.pbuf; \
let old_pstack = GET_PSTACK in \
let pstack = [] in \
SET_PSTACK; \
let rec loop depth state str ~max_pos ~pos = \
let rec parse_block_depth state str ~max_pos ~pos = \
if pos > max_pos then \
mk_cont "parse_block_depth" parse_block_depth state \
else \
match GET_CHAR with \
| '\010' -> bump_line_cont state str ~max_pos ~pos parse_block_depth \
| '"' -> \
REGISTER_POS1 \
let rec parse_block_quote parse state str ~max_pos ~pos = \
match parse state str ~max_pos ~pos with \
| Done (_sexp, { Parse_pos.buf_pos = pos; _ }) -> \
Buffer.clear state.pbuf; \
parse_block_depth state str ~max_pos ~pos \
| Cont (_, cont_parse) -> \
Buffer.clear state.pbuf; \
let parse = mk_cont_parser cont_parse in \
mk_cont_state "parse_block_quote" \
(parse_block_quote parse) state \
~cont_state:Cont_state.Parsing_block_comment \
in \
bump_pos_cont state str ~max_pos ~pos \
(parse_block_quote parse_quoted) \
| '#' -> bump_pos_cont state str ~max_pos ~pos parse_open_block \
| '|' -> bump_pos_cont state str ~max_pos ~pos parse_close_block \
| _ -> bump_pos_cont state str ~max_pos ~pos parse_block_depth \
and parse_open_block state str ~max_pos ~pos = \
if pos > max_pos then \
mk_cont "parse_open_block" parse_open_block state \
else \
if GET_CHAR = '|' then \
bump_pos_cont state str ~max_pos ~pos (loop (depth + 1)) \
else parse_block_depth state str ~max_pos ~pos \
and parse_close_block state str ~max_pos ~pos = \
if pos > max_pos then \
mk_cont "parse_close_block" parse_close_block state \
else if GET_CHAR = '#' then \
let parse = \
if depth = 1 then \
let () = Buffer.clear state.pbuf in \
let pstack = old_pstack in \
SET_PSTACK; \
PARSE \
else loop (depth - 1) \
in \
bump_pos_cont state str ~max_pos ~pos parse \
else parse_block_depth state str ~max_pos ~pos \
in \
parse_block_depth state str ~max_pos ~pos \
in \
loop 1 state str ~max_pos ~pos \
\
and parse_atom state str ~max_pos ~pos = \
if pos > max_pos then mk_cont "parse_atom" parse_atom state \
else \
match GET_CHAR with \
| ' ' | '\009' | '\012' -> \
bump_found_atom bump_text_pos state str ~max_pos ~pos PARSE \
| '#' as c -> \
add_bump_pos state str ~max_pos ~pos c maybe_parse_bad_atom_hash \
| '|' as c -> \
add_bump_pos state str ~max_pos ~pos c maybe_parse_bad_atom_pipe \
| '(' -> \
let pbuf = state.pbuf in \
let pbuf_str = Buffer.contents pbuf in \
let atom = MK_ATOM in \
(match GET_PSTACK with \
| [] -> Done (atom, mk_parse_pos state pos) \
| rev_sexp_lst :: sexp_stack -> \
REGISTER_POS \
Buffer.clear pbuf; \
let pstack = [] :: (atom :: rev_sexp_lst) :: sexp_stack in \
SET_PSTACK; \
bump_pos_cont state str ~max_pos ~pos PARSE) \
| ')' -> \
let pbuf = state.pbuf in \
let pbuf_str = Buffer.contents pbuf in \
let atom = MK_ATOM in \
(match GET_PSTACK with \
| [] -> Done (atom, mk_parse_pos state pos) \
| rev_sexp_lst :: sexp_stack -> \
let sexp_lst = List.rev_append rev_sexp_lst [atom] in \
let sexp = MK_LIST in \
match sexp_stack with \
| [] -> Done (sexp, mk_parse_pos state (pos + 1)) \
| higher_rev_sexp_lst :: higher_sexp_stack -> \
Buffer.clear pbuf; \
let pstack = \
(sexp :: higher_rev_sexp_lst) :: higher_sexp_stack \
in \
SET_PSTACK; \
bump_pos_cont state str ~max_pos ~pos PARSE) \
| '\010' -> bump_found_atom bump_text_line state str ~max_pos ~pos PARSE \
| '\013' -> \
bump_found_atom bump_text_pos state str ~max_pos ~pos parse_nl \
| ';' -> \
bump_found_atom bump_text_pos state str ~max_pos ~pos parse_comment \
| '"' -> \
bump_found_atom \
bump_text_pos state str ~max_pos ~pos reg_parse_quoted \
| c -> add_bump_pos state str ~max_pos ~pos c parse_atom \
\
and maybe_parse_bad_atom_pipe state str ~max_pos ~pos = \
if pos > max_pos then \
mk_cont "maybe_parse_bad_atom_pipe" maybe_parse_bad_atom_pipe state \
else \
match GET_CHAR with \
| '#' -> \
let err_msg = "illegal end of block comment in unquoted atom" in \
raise_parse_error (MK_PARSE_STATE state) "maybe_parse_bad_atom_pipe" \
pos err_msg \
| _ -> parse_atom state str ~max_pos ~pos \
\
and maybe_parse_bad_atom_hash state str ~max_pos ~pos = \
if pos > max_pos then \
mk_cont "maybe_parse_bad_atom_hash" maybe_parse_bad_atom_hash state \
else \
match GET_CHAR with \
| '|' -> \
let err_msg = "illegal start of block comment in unquoted atom" in \
raise_parse_error (MK_PARSE_STATE state) "maybe_parse_bad_atom_hash" \
pos err_msg \
| _ -> parse_atom state str ~max_pos ~pos \
\
and reg_parse_quoted state str ~max_pos ~pos = \
REGISTER_POS \
parse_quoted state str ~max_pos ~pos \
\
and parse_quoted state str ~max_pos ~pos = \
if pos > max_pos then mk_cont "parse_quoted" parse_quoted state \
else \
match GET_CHAR with \
| '"' -> \
let pbuf = state.pbuf in \
let pbuf_str = Buffer.contents pbuf in \
let atom = MK_ATOM in \
(match GET_PSTACK with \
| [] -> Done (atom, mk_parse_pos state (pos + 1)) \
| rev_sexp_lst :: sexp_stack -> \
Buffer.clear pbuf; \
let pstack = (atom :: rev_sexp_lst) :: sexp_stack in \
SET_PSTACK; \
bump_pos_cont state str ~max_pos ~pos PARSE) \
| '\\' -> bump_pos_cont state str ~max_pos ~pos parse_escaped \
| '\010' as c -> add_bump_line state str ~max_pos ~pos c parse_quoted \
| c -> add_bump_pos state str ~max_pos ~pos c parse_quoted \
\
and parse_escaped state str ~max_pos ~pos = \
if pos > max_pos then mk_cont "parse_escaped" parse_escaped state \
else \
match GET_CHAR with \
| '\010' -> bump_line_cont state str ~max_pos ~pos parse_skip_ws \
| '\013' -> bump_pos_cont state str ~max_pos ~pos parse_skip_ws_nl \
| '0' .. '9' as c -> \
bump_text_pos state; \
let d = Char.code c - 48 in \
parse_dec state str ~max_pos ~pos:(pos + 1) ~count:2 ~d \
| 'x' -> \
bump_text_pos state; \
parse_hex state str ~max_pos ~pos:(pos + 1) ~count:2 ~d:0 \
| ('\\' | '"' | '\'' ) as c -> \
add_bump_pos state str ~max_pos ~pos c parse_quoted \
| 'n' -> add_bump_pos state str ~max_pos ~pos '\n' parse_quoted \
| 't' -> add_bump_pos state str ~max_pos ~pos '\t' parse_quoted \
| 'b' -> add_bump_pos state str ~max_pos ~pos '\b' parse_quoted \
| 'r' -> add_bump_pos state str ~max_pos ~pos '\r' parse_quoted \
| c -> \
Buffer.add_char state.pbuf '\\'; \
add_bump_pos state str ~max_pos ~pos c parse_quoted \
\
and parse_skip_ws state str ~max_pos ~pos = \
if pos > max_pos then mk_cont "parse_skip_ws" parse_skip_ws state \
else \
match GET_CHAR with \
| ' ' | '\009' -> bump_pos_cont state str ~max_pos ~pos parse_skip_ws \
| _ -> parse_quoted state str ~max_pos ~pos \
\
and parse_skip_ws_nl state str ~max_pos ~pos = \
if pos > max_pos then mk_cont "parse_skip_ws_nl" parse_skip_ws_nl state \
else \
if GET_CHAR = '\010' then \
bump_line_cont state str ~max_pos ~pos parse_skip_ws \
else begin \
Buffer.add_char state.pbuf '\013'; \
parse_quoted state str ~max_pos ~pos \
end \
\
and parse_dec state str ~max_pos ~pos ~count ~d = \
if pos > max_pos then mk_cont "parse_dec" (parse_dec ~count ~d) state \
else \
match GET_CHAR with \
| '0' .. '9' as c -> \
let d = 10 * d + Char.code c - 48 in \
if count = 1 then \
if d > 255 then \
let err_msg = sprintf "illegal decimal escape: \\%d" d in \
raise_parse_error (MK_PARSE_STATE state) "parse_dec" pos err_msg \
else \
add_bump_pos state str ~max_pos ~pos (Char.chr d) parse_quoted \
else ( \
bump_text_pos state; \
parse_dec state str ~max_pos ~pos:(pos + 1) ~count:(count - 1) ~d) \
| c -> raise_unexpected_char (MK_PARSE_STATE state) "parse_dec" pos c \
\
and parse_hex state str ~max_pos ~pos ~count ~d = \
if pos > max_pos then mk_cont "parse_hex" (parse_hex ~count ~d) state \
else \
match GET_CHAR with \
| '0' .. '9' | 'a' .. 'f' | 'A' .. 'F' as c -> \
let corr = \
if c >= 'a' then 87 \
else if c >= 'A' then 55 \
else 48 \
in \
let d = 16 * d + Char.code c - corr in \
if count = 1 then \
if d > 255 then \
let err_msg = sprintf "illegal hexadecimal escape: \\%x" d in \
raise_parse_error (MK_PARSE_STATE state) "parse_hex" pos err_msg \
else \
add_bump_pos state str ~max_pos ~pos (Char.chr d) parse_quoted \
else ( \
bump_text_pos state; \
parse_hex state str ~max_pos ~pos:(pos + 1) ~count:(count - 1) ~d) \
| c -> raise_unexpected_char (MK_PARSE_STATE state) "parse_hex" pos c \
\
let PARSE ?(parse_pos = Parse_pos.create ()) ?len str = \
let pos = parse_pos.Parse_pos.buf_pos in \
let len = \
match len with \
| Some len -> len \
| None -> GET_LEN str - pos \
in \
let max_pos = check_str_bounds "parse" ~pos ~len str in \
let state = \
{ \
parse_pos; \
pstack = INIT_PSTACK; \
pbuf = Buffer.create 128; \
} \
in \
PARSE state str ~max_pos ~pos
(* Plain parser over strings: defines [parse_str].  The stack is kept
   directly in [state.pstack], no positions are registered, and atoms and
   lists are built with the ordinary constructors. *)
MK_PARSER(
string, String.length, parse_str, str.[pos],
state.pstack, state.pstack <- pstack,
,,
Atom pbuf_str, List sexp_lst, [], `Sexp
)
(* Default parser: same function as [parse_str]. *)
let parse = parse_str
(* Annot parsers *)
(* [get_glob_ofs parse_pos pos] converts the buffer index [pos] into a
   global offset, relative to the position recorded in [parse_pos]. *)
let get_glob_ofs parse_pos pos =
  let consumed = pos - parse_pos.Parse_pos.buf_pos in
  parse_pos.Parse_pos.global_offset + consumed

(* Annotation position for buffer index [pos], using the current text line
   and column of [parse_pos]. *)
let mk_annot_pos parse_pos pos =
  {
    Annot.line = parse_pos.Parse_pos.text_line;
    col = parse_pos.Parse_pos.text_char;
    offset = get_glob_ofs parse_pos pos;
  }

(* Same as [mk_annot_pos], but with the column shifted right by one. *)
let mk_annot_pos1 parse_pos pos =
  let base = mk_annot_pos parse_pos pos in
  { base with Annot.col = base.Annot.col + 1 }

(* Push the position of buffer index [pos] onto the stack of recorded
   start positions. *)
let add_annot_pos { parse_pos; pstack; pbuf = _ } pos =
  let start = mk_annot_pos parse_pos pos in
  pstack.Annot.positions <- start :: pstack.Annot.positions

(* Same as [add_annot_pos], using [mk_annot_pos1]. *)
let add_annot_pos1 { parse_pos; pstack; pbuf = _ } pos =
  let start = mk_annot_pos1 parse_pos pos in
  pstack.Annot.positions <- start :: pstack.Annot.positions
let get_annot_range { parse_pos; pstack; pbuf = _ } pos =
let start_pos =
match pstack.Annot.positions with
| [] -> assert false (* impossible *)
| h :: t -> pstack.Annot.positions <- t; h
in
let end_pos =
{
Annot.
line = parse_pos.Parse_pos.text_line;
col = parse_pos.Parse_pos.text_char;
offset = get_glob_ofs parse_pos pos;
}
in
{ Annot.start_pos; end_pos }
let mk_annot_atom parse_state str pos =
Annot.Atom (get_annot_range parse_state pos, Atom str)
(* Build an annotated list node from the annotated elements [annot_lst].  The
   node carries its range, the annotated elements, and the plain list made
   from the plain S-expression of each element (in the same order). *)
let mk_annot_list parse_state annot_lst pos =
  let range = get_annot_range parse_state pos in
  (* rev_map followed by rev is an order-preserving, tail-recursive map. *)
  let rev_plain = List.rev_map Annot.get_sexp annot_lst in
  let plain = List (List.rev rev_plain) in
  Annot.List (range, annot_lst, plain)
(* Fresh annotation parser state: no recorded positions and an empty parse
   stack. *)
let init_annot_pstate () =
  { Annot.stack = []; positions = [] }
(* Instantiate the generic parser macro for plain strings, defining
   parse_str_annot, which produces annotated S-expressions.  The parse stack
   is the stack field of the annotation state, the two hook slots record
   positions through add_annot_pos and add_annot_pos1, results are built with
   mk_annot_atom and mk_annot_list, and the initial state comes from
   init_annot_pstate. *)
MK_PARSER(
string, String.length, parse_str_annot, str.[pos],
state.pstack.Annot.stack, state.pstack.Annot.stack <- pstack,
add_annot_pos state pos;,add_annot_pos1 state pos;,
mk_annot_atom state pbuf_str pos, mk_annot_list state sexp_lst pos,
init_annot_pstate (), `Annot
)
(* Partial parsing from bigstrings *)
(* NOTE: this is really an awful duplication of the code for parsing
strings, but since OCaml does not inline higher-order functions known
at compile time, other solutions would sacrifice a lot of efficiency. *)
(* Instantiate the generic parser macro for bigstrings, defining
   parse_bigstring.  Length comes from Array1.dim and characters are read
   with bigarray indexing; results are plain Atom and List values, the
   initial parse stack is the empty list, and the two position hook slots
   are left empty. *)
MK_PARSER(
bigstring, Array1.dim, parse_bigstring, str.{pos},
state.pstack, state.pstack <- pstack,
,,
Atom pbuf_str, List sexp_lst, [], `Sexp
)
(* Instantiate the generic parser macro for bigstrings, defining
   parse_bigstring_annot, which produces annotated S-expressions.  Position
   bookkeeping and result construction use the same helpers as the
   annotating string parser: add_annot_pos, add_annot_pos1, mk_annot_atom,
   mk_annot_list and init_annot_pstate. *)
MK_PARSER(
bigstring, Array1.dim, parse_bigstring_annot, str.{pos},
state.pstack.Annot.stack, state.pstack.Annot.stack <- pstack,
add_annot_pos state pos;,add_annot_pos1 state pos;,
mk_annot_atom state pbuf_str pos, mk_annot_list state sexp_lst pos,
init_annot_pstate (), `Annot
)
(* Input functions *)
(* Wrap the top-level parser [my_parse] as a function taking labelled [pos]
   and [len] arguments followed by the input.  When [parse_pos] is supplied
   its buffer position is overwritten with [pos] and it is reused; otherwise
   a fresh parse position starting at [pos] is created.  The leading unit
   expression makes the function return a closure after receiving
   [parse_pos] and [my_parse]. *)
let mk_this_parse ?parse_pos my_parse = (); fun ~pos ~len str ->
  let positioned =
    match parse_pos with
    | Some known -> known.Parse_pos.buf_pos <- pos; known
    | None -> Parse_pos.create ~buf_pos:pos ()
  in
  my_parse ?parse_pos:(Some positioned) ?len:(Some len) str
(* Read exactly one S-expression from channel [ic] with parser [my_parse].
   Input is consumed one character at a time through a one-character buffer
   and fed to the incremental parser until it reports completion.  Any
   exception raised by input_char propagates to the caller. *)
let gen_input_sexp my_parse ?parse_pos ic =
  let buf = String.create 1 in
  let rec feed this_parse =
    buf.[0] <- input_char ic;
    match this_parse ~pos:0 ~len:1 buf with
    | Cont (_, next_parse) -> feed next_parse
    | Done (sexp, _) -> sexp
  in
  feed (mk_this_parse ?parse_pos my_parse)
(* Read one plain S-expression from channel [ic] using the default string
   parser. *)
let input_sexp ?parse_pos ic = gen_input_sexp parse ?parse_pos ic
(* Read S-expressions from channel [ic] with parser [my_parse] until a read
   returns no data, and return them most recent first.  [parse_pos]
   optionally supplies the initial parse position and [buf] is the read
   buffer (8192 bytes when not supplied).  Raises Failure if input runs out
   while the parser is in any state other than Parsing_whitespace. *)
let gen_input_rev_sexps my_parse ?parse_pos ?(buf = String.create 8192) ic =
let rev_sexps_ref = ref [] in
let buf_len = String.length buf in
(* [pos] and [len] delimit the unparsed part of [buf]; [cont_state] is the
   parser state to report if input ends here. *)
let rec loop this_parse ~pos ~len ~cont_state =
if len > 0 then
match this_parse ~pos ~len buf with
| Done (sexp, ({ Parse_pos.buf_pos; _ } as parse_pos)) ->
rev_sexps_ref := sexp :: !rev_sexps_ref;
let n_parsed = buf_pos - pos in
(* Start a new top-level parse that keeps the current parse position. *)
let this_parse = mk_this_parse ~parse_pos my_parse in
let cont_state = Cont_state.Parsing_whitespace in
if n_parsed = len then
(* The whole chunk was consumed: refill the buffer from the channel. *)
let new_len = input ic buf 0 buf_len in
loop this_parse ~pos:0 ~len:new_len ~cont_state
(* Otherwise continue with the rest of the current chunk. *)
else loop this_parse ~pos:buf_pos ~len:(len - n_parsed) ~cont_state
| Cont (cont_state, this_parse) ->
(* The parser needs more data: refill and resume the continuation. *)
loop this_parse ~pos:0 ~len:(input ic buf 0 buf_len) ~cont_state
else
(* No data left: fine between expressions, an error inside one. *)
if cont_state = Cont_state.Parsing_whitespace then !rev_sexps_ref
else
failwith (
"Sexplib.Sexp.input_rev_sexps: reached EOF while in state "
^ Cont_state.to_string cont_state)
in
let len = input ic buf 0 buf_len in
let this_parse = mk_this_parse ?parse_pos my_parse in
loop this_parse ~pos:0 ~len ~cont_state:Cont_state.Parsing_whitespace
(* Read all plain S-expressions from channel [ic] with the default string
   parser, most recent first. *)
let input_rev_sexps ?parse_pos ?buf ic =
gen_input_rev_sexps parse ?parse_pos ?buf ic
(* Same as input_rev_sexps, with the result reversed so that expressions
   appear in input order. *)
let input_sexps ?parse_pos ?buf ic =
List.rev (input_rev_sexps ?parse_pos ?buf ic)
(* of_string and of_bigstring *)
(* Shared implementation of whole-input conversion for strings and
   bigstrings.  [loc] names the caller in error messages, [this_parse] parses
   the complete input [str], [ws_buf] is a one-character whitespace input of
   the same type, and [get_len] / [get_sub] measure and slice the input.
   Raises Failure if the S-expression is followed by further data or if the
   input is incomplete. *)
let of_string_bigstring loc this_parse ws_buf get_len get_sub str =
  match this_parse str with
  | Done (sexp, { Parse_pos.buf_pos; _ }) ->
      let total = get_len str in
      if buf_pos = total then sexp
      else begin
        (* Show at most 20 characters of the unexpected trailing data. *)
        let shown = min (total - buf_pos) 20 in
        let trailing = get_sub str buf_pos shown in
        failwith (
          sprintf
            "Sexplib.Sexp.%s: S-expression followed by data at position %d: %S..."
            loc buf_pos trailing)
      end
  | Cont (_, resume) ->
      (* When parsing atoms, the incremental parser cannot tell whether
         it is at the end until it hits whitespace.  We therefore feed it
         one space to determine whether it is finished. *)
      begin match resume ~pos:0 ~len:1 ws_buf with
      | Done (sexp, _) -> sexp
      | Cont (cont_state, _) ->
          let state_name = Cont_state.to_string cont_state in
          let whole_input = get_sub str 0 (get_len str) in
          failwith (
            sprintf
              "Sexplib.Sexp.%s: incomplete S-expression while in state %s: %s"
              loc state_name whole_input)
      end
(* Convert the whole of string [str] to a plain S-expression; raises Failure
   on trailing data or incomplete input (see of_string_bigstring). *)
let of_string str =
of_string_bigstring "of_string" parse " " String.length String.sub str
(* Copy [len] characters of bigstring [bstr], starting at index [pos], into
   a freshly allocated string. *)
let get_bstr_sub_str bstr pos len =
  let res = String.create len in
  let rec fill i =
    if i < len then begin
      res.[i] <- bstr.{pos + i};
      fill (i + 1)
    end
  in
  fill 0;
  res
(* One-character bigstring holding a single space; of_bigstring feeds it to
   the parser to terminate a trailing atom. *)
let bstr_ws_buf =
  let ws = Array1.create char c_layout 1 in
  ws.{0} <- ' ';
  ws
(* Convert the whole of bigstring [bstr] to a plain S-expression; raises
   Failure on trailing data or incomplete input (see of_string_bigstring). *)
let of_bigstring bstr =
of_string_bigstring
"of_bigstring" parse_bigstring bstr_ws_buf Array1.dim get_bstr_sub_str bstr
(* Loading *)
(* Open [file], read all of its S-expressions with [input_rev_sexps] and
   return them in the order that function yields.  The channel is closed
   before returning; if anything raises, it is closed without reporting
   close errors and the exception is re-raised. *)
let gen_load_rev_sexps input_rev_sexps ?buf file =
  let chan = open_in file in
  try
    let rev_sexps = input_rev_sexps ?parse_pos:None ?buf chan in
    close_in chan;
    rev_sexps
  with err ->
    close_in_noerr chan;
    raise err
(* Load all plain S-expressions from [file], most recent first. *)
let load_rev_sexps ?buf file = gen_load_rev_sexps input_rev_sexps ?buf file
(* Load all plain S-expressions from [file] in file order. *)
let load_sexps ?buf file = List.rev (load_rev_sexps ?buf file)
(* Location prefix used in the error messages of gen_load_sexp. *)
let gen_load_sexp_loc = "Sexplib.Sexp.gen_load_sexp"
(* Load a single S-expression from [file] with incremental parser [my_parse].
   [buf] is the read buffer (8192 bytes when not supplied).  When [strict] is
   true (the default) the remainder of the file is parsed as well: a second
   complete S-expression, or input that ends in a state other than
   Parsing_whitespace, raises Failure.  When [strict] is false the first
   S-expression is returned and the rest of the file is not examined.
   Failure is also raised when a read returns no data before the first
   S-expression is complete.  The channel is closed on the normal path and,
   without reporting close errors, on the exceptional path. *)
let gen_load_sexp my_parse ?(strict = true) ?(buf = String.create 8192) file =
let buf_len = String.length buf in
let ic = open_in file in
(* Read chunk after chunk until the first S-expression is complete. *)
let rec loop this_parse ~cont_state =
let len = input ic buf 0 buf_len in
if len = 0 then
failwith (
sprintf "%s: EOF in %s while in state %s"
gen_load_sexp_loc file (Cont_state.to_string cont_state))
else
match this_parse ~pos:0 ~len buf with
| Done (sexp, ({ Parse_pos.buf_pos; _ } as parse_pos)) when strict ->
(* Keep parsing what follows to verify that only whitespace remains. *)
let rec strict_loop this_parse ~pos ~len =
match this_parse ~pos ~len buf with
| Done _ ->
failwith (
sprintf "%s: more than one S-expression in file %s"
gen_load_sexp_loc file)
| Cont (cont_state, this_parse) ->
let len = input ic buf 0 buf_len in
if len > 0 then strict_loop this_parse ~pos:0 ~len
else if cont_state = Cont_state.Parsing_whitespace then sexp
else
failwith (
sprintf "%s: %s in state %s loading file %s"
gen_load_sexp_loc "additional incomplete data"
(Cont_state.to_string cont_state) file)
in
let this_parse = mk_this_parse ~parse_pos my_parse in
(* Resume in the current chunk right after the first S-expression. *)
strict_loop this_parse ~pos:buf_pos ~len:(len - buf_pos)
| Done (sexp, _) -> sexp
| Cont (cont_state, this_parse) -> loop this_parse ~cont_state
in
try
let sexp =
loop (mk_this_parse my_parse) ~cont_state:Cont_state.Parsing_whitespace
in
close_in ic;
sexp
with exc -> close_in_noerr ic; raise exc
(* Load a single plain S-expression from [file] with the default string
   parser. *)
let load_sexp ?strict ?buf file = gen_load_sexp parse ?strict ?buf file
(* Counterparts of the plain parsing, input and loading functions that
   produce annotated S-expressions, together with helpers that turn
   conversion errors into located errors. *)
module Annotated = struct
  include Annot

  (* Annotating parsers for strings and bigstrings. *)
  let parse = parse_str_annot
  let parse_bigstring = parse_bigstring_annot

  (* Channel input, built on the annotating string parser. *)
  let input_rev_sexps ?parse_pos ?buf ic =
    gen_input_rev_sexps parse ?parse_pos ?buf ic

  let input_sexp ?parse_pos ic = gen_input_sexp parse ?parse_pos ic

  let input_sexps ?parse_pos ?buf ic =
    let rev_sexps = input_rev_sexps ?parse_pos ?buf ic in
    List.rev rev_sexps

  (* Whole-input conversion from strings and bigstrings. *)
  let of_string str =
    of_string_bigstring
      "Annotated.of_string" parse " " String.length String.sub str

  let of_bigstring bstr =
    of_string_bigstring
      "Annotated.of_bigstring"
      parse_bigstring bstr_ws_buf Array1.dim get_bstr_sub_str bstr

  (* File loading. *)
  let load_rev_sexps ?buf file = gen_load_rev_sexps input_rev_sexps ?buf file

  let load_sexps ?buf file =
    let rev_sexps = load_rev_sexps ?buf file in
    List.rev rev_sexps

  let load_sexp ?strict ?buf file = gen_load_sexp parse ?strict ?buf file

  (* Apply converter [f] to the plain S-expression inside [annot_sexp].  On
     success the value is wrapped in the Result variant.  If [f] raises
     Of_sexp_error, the offending subexpression is looked up in [annot_sexp]
     and returned, annotated, in the Error variant; when the lookup fails the
     original exception is re-raised. *)
  let conv f annot_sexp =
    let plain = get_sexp annot_sexp in
    try `Result (f plain)
    with Of_sexp_error (exc, bad_sexp) as original ->
      begin match find_sexp annot_sexp bad_sexp with
      | Some bad_annot_sexp -> `Error (exc, bad_annot_sexp)
      | None -> raise original
      end

  (* Build an Of_sexp_error whose payload wraps [exc] together with a
     file:line:col location taken from the start of the range of
     [annot_sexp]. *)
  let get_conv_exn ~file ~exc annot_sexp =
    let start = (get_range annot_sexp).start_pos in
    let loc = sprintf "%s:%d:%d" file start.line start.col in
    let located = Annot.Conv_exn (loc, exc) in
    Of_sexp_error (located, get_sexp annot_sexp)
end
(* Load one S-expression from [file] and convert it with [f].  The fast path
   uses the plain parser; if [f] raises Of_sexp_error the file is loaded
   again with annotations and converted through Annotated.conv, so that the
   result can carry the annotated subexpression that failed. *)
let load_sexp_conv ?(strict = true) ?(buf = String.create 8192) file f =
  let sexp = load_sexp ~strict ~buf file in
  try `Result (f sexp)
  with Of_sexp_error _ ->
    let annot_sexp = Annotated.load_sexp ~strict ~buf file in
    Annotated.conv f annot_sexp
(* Unwrap a conversion outcome: return the value of a Result, or raise the
   located conversion exception built by Annotated.get_conv_exn for an
   Error. *)
let raise_conv_exn ~file outcome =
  match outcome with
  | `Error (exc, annot_sexp) ->
      raise (Annotated.get_conv_exn ~file ~exc annot_sexp)
  | `Result res -> res
(* Same as load_sexp_conv, except that a conversion error is raised as a
   located exception instead of being returned. *)
let load_sexp_conv_exn ?strict ?buf file f =
  let outcome = load_sexp_conv ?strict ?buf file f in
  raise_conv_exn ~file outcome
(* Load every S-expression in [file] and convert each with [f], returning
   the outcomes in file order.  If any conversion raises Of_sexp_error the
   file is loaded again with annotations and every expression is converted
   through Annotated.conv. *)
let load_sexps_conv ?(buf = String.create 8192) file f =
  let rev_sexps = load_rev_sexps ~buf file in
  let wrap sexp = `Result (f sexp) in
  try List.rev_map wrap rev_sexps
  with Of_sexp_error _ as original ->
    begin match Annotated.load_rev_sexps ~buf file with
    | _ :: _ as rev_annot_sexps ->
        List.rev_map (Annotated.conv f) rev_annot_sexps
    | [] ->
        (* File is now empty - perhaps it was a temporary file handle? *)
        raise original
    end
(* Load every S-expression in [file] and convert each with [f], returning
   the values in file order.  If any conversion raises Of_sexp_error the
   file is loaded again with annotations and converted once more, so that
   the failure is raised as a located exception. *)
let load_sexps_conv_exn ?(buf = String.create 8192) file f =
  let rev_sexps = load_rev_sexps ~buf file in
  try List.rev_map f rev_sexps
  with Of_sexp_error _ as original ->
    let conv_or_raise annot_sexp =
      raise_conv_exn ~file (Annotated.conv f annot_sexp)
    in
    begin match Annotated.load_rev_sexps ~buf file with
    | _ :: _ as rev_annot_sexps -> List.rev_map conv_or_raise rev_annot_sexps
    | [] ->
        (* File is now empty - perhaps it was a temporary file handle? *)
        raise original
    end
(* Parse [str] with [of_string] and convert the result with [f].  If [f]
   raises Of_sexp_error, [str] is parsed again with [annot_of_string] and
   converted through Annotated.conv. *)
let gen_of_string_conv of_string annot_of_string str f =
  let sexp = of_string str in
  try `Result (f sexp)
  with Of_sexp_error _ ->
    let annot_sexp = annot_of_string str in
    Annotated.conv f annot_sexp
(* Parse string [str] and convert it with [f]; see gen_of_string_conv. *)
let of_string_conv str f =
gen_of_string_conv of_string Annotated.of_string str f
(* Parse bigstring [bstr] and convert it with [f]; see gen_of_string_conv. *)
let of_bigstring_conv bstr f =
gen_of_string_conv of_bigstring Annotated.of_bigstring bstr f
(* Payload and exception raised by gen_of_string_conv_exn when a conversion
   fails: exc is the exception carried by the conversion error, sexp is the
   complete parsed S-expression, and sub_sexp is the subexpression reported
   by the conversion error. *)
module Of_string_conv_exn = struct
type t = { exc : exn; sexp : Type.t; sub_sexp : Type.t }
exception E of t
end
(* Parse [str] with [of_string] and convert the result with [f].  An
   Of_sexp_error raised by [f] is replaced by Of_string_conv_exn.E, which
   carries the original exception, the whole parsed S-expression and the
   offending subexpression. *)
let gen_of_string_conv_exn of_string str f =
  let sexp = of_string str in
  try f sexp
  with Of_sexp_error (exc, sub_sexp) ->
    let open Of_string_conv_exn in
    raise (E { exc; sexp; sub_sexp })
(* Parse string [str] and convert it with [f]; a conversion error is raised
   as Of_string_conv_exn.E. *)
let of_string_conv_exn str f = gen_of_string_conv_exn of_string str f
(* Parse bigstring [bstr] and convert it with [f]; a conversion error is
   raised as Of_string_conv_exn.E. *)
let of_bigstring_conv_exn bstr f = gen_of_string_conv_exn of_bigstring bstr f
(* Utilities for automated type conversions *)
(* The empty list S-expression, bound to the name unit. *)
let unit = List []
(* Converters between S-expressions and themselves; both are the identity
   primitive. *)
external sexp_of_t : t -> t = "%identity"
external t_of_sexp : t -> t = "%identity"
(* Utilities for conversion error handling *)
(* Path to a located subexpression, as produced by search_physical: Found
   marks the target itself, while Pos (i, rest) selects element i of a list
   and continues with rest inside that element. *)
type found = [ `Found | `Pos of int * found ]
(* Outcome of a search: either a path or Not_found. *)
type search_result = [ `Not_found | found ]
(* Search [sexp] depth-first, left to right, for a node that is physically
   equal to [contained].  Returns Found when [sexp] itself is that node, a
   chain of Pos indices leading to the first match inside a list, or
   Not_found when there is no such node. *)
let rec search_physical sexp ~contained =
  if sexp == contained then `Found
  else
    match sexp with
    | List elems ->
        let rec scan idx = function
          | first :: rest ->
              (match search_physical first ~contained with
               | #found as path -> `Pos (idx, path)
               | `Not_found -> scan (idx + 1) rest)
          | [] -> `Not_found
        in
        scan 0 elems
    | Atom _ -> `Not_found
(* Return a copy of [sexp] in which the node designated by the given path is
   replaced by [subst].  Found replaces the current node; Pos (i, rest)
   descends into element i of a list and continues with rest.  Raises
   Failure if the path asks for a position inside an atom or beyond the end
   of a list. *)
let rec subst_found sexp ~subst = function
  | `Found -> subst
  | `Pos (pos, found) ->
      match sexp with
      | List lst ->
          (* [before] collects, in reverse, the elements preceding the
             target. *)
          let rec walk before remaining = function
            | [] ->
                failwith
                  "Sexplib.Sexp.subst_found: short list when position requested"
            | h :: t ->
                if remaining = 0 then
                  List (List.rev_append before (subst_found h ~subst found :: t))
                else walk (h :: before) (remaining - 1) t
          in
          walk [] pos lst
      | Atom _ ->
          failwith "Sexplib.Sexp.subst_found: atom when position requested"
|