(* ENIAMlexSemanticsStringOf.ml *)
(*
* ENIAMlexSemantics is a library that assigns tokens with lexicosemantic information.
* Copyright (C) 2016-2017 Wojciech Jaworski <wjaworski atSPAMfree mimuw dot edu dot pl>
* Copyright (C) 2016-2017 Institute of Computer Science Polish Academy of Sciences
*
* This library is free software: you can redistribute it and/or modify
* it under the terms of the GNU Lesser General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*)
open ENIAMlexSemanticsTypes
open Printf
(*let lex_sem t = "not implemented"
let lex_sems t =
String.concat "\n" (List.rev (Int.fold 0 (ExtArray.size t - 1) [] (fun l id ->
let t2 = ExtArray.get t id in
(Printf.sprintf "%3d %s" id (lex_sem t2)) :: l)))*)
(* Builds the role suffix printed after the "*" marker of a frame.
   Each non-empty component is prefixed with a comma: first [f.arole], then
   [f.arole_attr], then the literal "rev" when [f.arev] is true. Empty
   components contribute nothing, so the result may be the empty string. *)
let arole f =
  (* "" stays "", anything else gets a leading comma. *)
  let prefixed s = if s = "" then "" else "," ^ s in
  let role = prefixed f.arole in
  let attr = prefixed f.arole_attr in
  let rev = if f.arev then ",rev" else "" in
  role ^ attr ^ rev
(* Renders the whole [lex_sems] array as text.
   For every index visited by [Int.fold 0 (ExtArray.size lex_sems - 1)] the
   entry of [lex_sems] and the entry of [tokens] stored under the same index
   are read and turned into a group of lines joined with "\n ":
     - a header "<id> <orth> <token>",
     - one "[selectors] {schema}" line per element of [schemata],
     - one "*<role>[selectors] {positions} meanings" line per element of [frames],
     - one "&[selectors] symbol" line per element of [lex_entries].
   The groups are joined with "\n". The accumulated list is reversed before
   joining; NOTE(review): this yields ascending index order provided
   [Int.fold] iterates upwards over an inclusive range - confirm against the
   [Int] module in use. *)
let string_of_lex_sems tokens lex_sems =
  (* "sense[hypernym n,...]weight" for a single meaning of a frame. *)
  let render_meaning (sense, hipero, weight) =
    let hipero_text =
      String.concat ","
        (Xlist.map hipero (fun (name, n) -> name ^ " " ^ string_of_int n)) in
    Printf.sprintf "%s[%s]%.2f" sense hipero_text weight in
  (* Text of the entry stored under index [id]. *)
  let render_entry id =
    let sem = ExtArray.get lex_sems id in
    let tok = ExtArray.get tokens id in
    let header =
      let orth = tok.ENIAMtokenizerTypes.orth in
      let lemma = ENIAMtokens.string_of_token tok.ENIAMtokenizerTypes.token in
      Printf.sprintf "%3d %s %s" id orth lemma in
    let lex_entry_lines = Xlist.map sem.lex_entries (fun (selectors, symbol) ->
      let sel = ENIAMcategoriesPL.string_of_selectors selectors in
      let sym = ENIAM_LCGstringOf.grammar_symbol 0 symbol in
      String.concat "" ["&["; sel; "] "; sym]) in
    let schema_lines = Xlist.map sem.schemata (fun (selectors, positions) ->
      let sel = ENIAMcategoriesPL.string_of_selectors selectors in
      let args = Xlist.map positions (fun (dir, symbol) ->
        ENIAM_LCGstringOf.direction dir ^ ENIAM_LCGstringOf.grammar_symbol 0 symbol) in
      String.concat "" ["["; sel; "] {"; String.concat "," args; "}"]) in
    (* Legacy rendering of frames and senses, kept for reference: *)
    (* let frames = Xlist.map t.frames (fun (selectors,meanings,schema) ->
    "*[" ^ ENIAMcategoriesPL.string_of_selectors selectors ^ "] {" ^ ENIAMwalStringOf.schema schema ^ "} " ^
    String.concat "," (Xlist.map meanings (fun m -> ENIAMwalStringOf.meaning m))) in
    let senses = Xlist.map t.senses (fun (sense,hipero,weight) ->
    Printf.sprintf "%s[%s]%.2f" sense (String.concat "," (Xlist.map hipero (fun (s,n) -> s ^ " " ^ string_of_int n))) weight) in*)
    let frame_lines = Xlist.map sem.frames (fun fr ->
      let role = arole fr in
      let sel = ENIAMcategoriesPL.string_of_selectors fr.selectors in
      let schema = ENIAMwalStringOf.schema fr.positions in
      let meanings = String.concat "," (Xlist.map fr.meanings render_meaning) in
      String.concat "" ["*"; role; "["; sel; "] {"; schema; "} "; meanings]) in
    (* Senses are no longer printed separately; they appear inside frames. *)
    String.concat "\n " (header :: (schema_lines @ frame_lines @ lex_entry_lines)) in
  (* Entries are consed onto the accumulator, hence the reversal below. *)
  let collected =
    Int.fold 0 (ExtArray.size lex_sems - 1) [] (fun acc id ->
      render_entry id :: acc) in
  String.concat "\n" (List.rev collected)
(* let lroles = if snd t.lroles = "" then fst t.lroles else fst t.lroles ^ " " ^ snd t.lroles in
let core = Printf.sprintf "%3d %s %s %s" id orth lemma lroles in
let valence = Xlist.map t.valence (ENIAMwalStringOf.fnum_frame "") in
let simple_valence = Xlist.map t.simple_valence (ENIAMwalStringOf.fnum_frame "") in
(* let semantics = *)
(String.concat "\n " ([core] @ senses @ valence @ simple_valence)) :: l))) *)