parsowanie przetworzonego Walentego

Wojciech Jaworski
1 parent ae919ded
Showing 15 changed files with 1139 additions and 1224 deletions
walenty/.gitignore
walenty/ENIAMwalConnect.ml
walenty/ENIAMwalFrames.ml
walenty/ENIAMwalGenerate.ml
walenty/ENIAMwalLex.ml
walenty/ENIAMwalParser.ml
walenty/ENIAMwalRealizations.ml
walenty/ENIAMwalReduce.ml
walenty/ENIAMwalStringOf.ml
walenty/ENIAMwalTEI.ml
walenty/ENIAMwalTypes.ml
walenty/ENIAMwalTypes2.ml
walenty/entries.ml
walenty/makefile
walenty/test.ml
 loader
+test
@@ -18,17 +18,7 @@
  *)
  
 open Xstd
-open ENIAMwalTypes
-
-(* let process_morfs = function
-    MorfId id -> id
-  | _ -> failwith "process_morfs"
-
-let process_positions positions =
-  Xlist.fold positions IntMap.empty (fun positions position ->
-    let r,cr,ce = ENIAMwalParser.parse_roles (position.gf :: position.control) in
-    let phrases = List.rev (Xlist.rev_map position.morfs process_morfs) in
-    IntMap.add positions position.psn_id (r,cr,ce,phrases)) *)
+open ENIAMwalTypes2
  
 let process_morfs morfs =
   Xlist.fold morfs IntMap.empty (fun morfs -> function
@@ -41,19 +31,18 @@ let process_positions positions =
  
 let process_schemata schemata =
   Xlist.fold schemata IntMap.empty (fun schemata schema ->
-    let schema_atrs = DefaultAtrs([],schema.reflexiveMark,
-      schema.opinion, schema.negativity, schema.predicativity, schema.aspect) in
+    let atrs = schema.negativity, schema.predicativity, schema.aspect in
     let positions = process_positions schema.positions in
-    IntMap.add schemata schema.sch_id (schema_atrs,positions))
+    IntMap.add schemata schema.sch_id (schema.reflexiveMark,schema.opinion,atrs,positions))
  
 (* Builds an IntMap from the given argument list, keyed by each argument's
    arg_id field. *)
 let process_arguments arguments =
   let index_by_id by_id arg = IntMap.add by_id arg.arg_id arg in
   Xlist.fold arguments IntMap.empty index_by_id
  
-let process_frames frames = (* FIXME: pomijam opinię *)
+let process_frames frames =
   Xlist.fold frames IntMap.empty (fun frames frame ->
       let arguments = process_arguments frame.arguments in
-      IntMap.add frames frame.frm_id (frame.meanings,arguments))
+      IntMap.add frames frame.frm_id (frame,arguments))
  
 let process_meanings meanings =
   Xlist.fold meanings IntMap.empty (fun meanings meaning ->
@@ -67,18 +56,15 @@ let process_sel_pref arguments = function
     RelationRole(s,arg.role,arg.role_attribute)
   | RelationRole _ -> failwith "process_sel_pref"
  
-let add_meanings meanings = function
-    DefaultAtrs(_,r,o,n,p,a) -> DefaultAtrs(meanings,r,o,n,p,a)
-  | _ -> failwith "add_meanings"
-
 let connect entry =
   let schemata = process_schemata entry.schemata in
   let frames = process_frames entry.frames in
   let meanings = process_meanings entry.meanings in
   Xlist.fold entry.alternations [] (fun found alt ->
-    let schema_atrs,positions = IntMap.find schemata alt.schema in
-    let meaning_ids,arguments = IntMap.find frames alt.frame in
-    let conn_positions = Xlist.fold alt.connections [] (fun conn_positions conn ->
+    let refl,opinion,schema_atrs,positions = IntMap.find schemata alt.schema in
+    let frame,arguments = IntMap.find frames alt.frame in
+    let conn_positions = if refl then [ENIAMwalTEI.refl_position] else [] in
+    let conn_positions = Xlist.fold alt.connections conn_positions (fun conn_positions conn ->
       let arg = IntMap.find arguments conn.argument in
       let sel_prefs = Xlist.map arg.sel_prefs (process_sel_pref arguments) in
       Xlist.fold conn.phrases conn_positions (fun conn_positions (position_id,phrase_ids) ->
@@ -89,191 +75,13 @@ let connect entry =
               with Not_found -> Printf.printf "%s\n%!" entry.form_orth;morfs) in
           {position with role=arg.role; role_attr=arg.role_attribute; sel_prefs=sel_prefs;
                          morfs=List.rev morfs} :: conn_positions)) in
-    let meanings = List.rev (Xlist.rev_map meaning_ids (fun id ->
+    let meanings = List.rev (Xlist.rev_map frame.meanings (fun id ->
           IntMap.find meanings id)) in
-    let schema_atrs = add_meanings meanings schema_atrs in
-    (Frame(schema_atrs,conn_positions)) :: found)
+    (opinion,frame.opinion,meanings,schema_atrs,conn_positions) :: found)
  
 let schemata entry =
   let schemata = process_schemata entry.schemata in
-  IntMap.fold schemata [] (fun found _ (schema_atrs,positions) ->
+  IntMap.fold schemata [] (fun found _ (refl,opinion,schema_atrs,positions) ->
       let positions = IntMap.fold positions [] (fun positions _ position -> position :: positions) in
-      (Frame(schema_atrs,positions)) :: found)
-
-(* Test wczytywania *)
-(* let _ =
-  let n = Xlist.fold ENIAMwalTEI.walenty 0 (fun n e -> let l = connect e in n + Xlist.size l) in
-  let m = Xlist.fold ENIAMwalTEI.walenty 0 (fun n e -> let l = schemata e in n + Xlist.size l) in
-  Printf.printf "%d connected\n%d schemata\n" n m;
-  () *)
-
-let connected_walenty =
-  Xlist.fold ENIAMwalTEI.walenty StringMap.empty (fun pos_map e ->
-      let orth_map = try StringMap.find pos_map e.form_pos with Not_found -> StringMap.empty in
-      let frames = connect e in
-      let orth_map = StringMap.add_inc orth_map e.form_orth frames (fun l -> frames @ l) in
-      StringMap.add pos_map e.form_pos orth_map)
-
-let schemata_walenty =
-  Xlist.fold ENIAMwalTEI.walenty StringMap.empty (fun pos_map e ->
-      let orth_map = try StringMap.find pos_map e.form_pos with Not_found -> StringMap.empty in
-      let frames = schemata e in
-      let orth_map = StringMap.add_inc orth_map e.form_orth frames (fun l -> frames @ l) in
-      StringMap.add pos_map e.form_pos orth_map)
-
-let insert_phrases phrases = function
-    Frame(atrs,s) -> Frame(atrs,Xlist.map s (fun p ->
-      {p with morfs=Xlist.map p.morfs (function
-             MorfId id -> (try IntMap.find phrases id with Not_found -> failwith "insert_phrases")
-           | _ -> failwith "insert_phrases")}))
-  | _ -> failwith "insert_phrases: ni"
-
-let print_entry pos_map pos orth =
-  let orth_map = try StringMap.find pos_map pos with Not_found -> StringMap.empty in
-  let frames = try StringMap.find orth_map orth with Not_found -> [] in
-  Xlist.iter frames (fun frame ->
-      let frame = insert_phrases ENIAMwalTEI.phrases frame in
-      print_endline (ENIAMwalStringOf.frame orth frame))
-
-(* Wypisanie hasła *)
-(* let _ =
-  print_entry connected_walenty "verb" "brudzić";
-  () *)
-
-let has_nontrivial_lex = function
-    Frame(atrs,s) -> Xlist.fold s false (fun b p ->
-      if p.role = "Lemma" && p.role_attr = "" then b else
-      Xlist.fold p.morfs b (fun b -> function
-            MorfId id -> failwith "has_nontrivial_lex"
-          | LexPhrase _ -> true
-          (* | LexRPhrase _ -> true
-          | LexPhraseMode _ -> true *)
-          | _ -> b))
-  | _ -> failwith "has_nontrivial_lex: ni"
-
-(* Leksykalizacje nie wchodzące do lematu *)
-(* let _ =
-  StringMap.iter connected_walenty (fun _ orth_map ->
-      StringMap.iter orth_map (fun orth frames ->
-          Xlist.iter frames (fun frame ->
-              let frame = insert_phrases ENIAMwalTEI.phrases frame in
-              if has_nontrivial_lex frame then
-                print_endline (ENIAMwalStringOf.frame orth frame)))) *)
-
-let simplify_frame_verb = function
-    Phrase(NP(Case "dat")) -> []
-  | Phrase(NP(Case "inst")) -> []
-  | Phrase(PrepNP _) -> []
-  | Phrase(ComprepNP _) -> []
-  | Phrase(AdvP) -> []
-  | t -> [t]
-
-let simplify_frame_noun = function
-    Phrase(NP(Case "gen")) -> []
-  | Phrase(NP(Case "nom")) -> []
-  | Phrase(NP(CaseAgr)) -> []
-  | Phrase(PrepNP _) -> []
-  | Phrase(ComprepNP _) -> []
-  | Phrase(AdjP CaseAgr) -> []
-  | PhraseComp(Ncp(Case "gen"),_)
-  | PhraseComp(Prepncp(_,_),_) -> []
-  | PhraseAbbr(Possp,[]) -> []
-  | t -> [t]
-
-let simplify_frame_adj = function
-  | t -> [t]
-
-let simplify_frame_adv = function
-  | t -> [t]
-
-
-let simplify_frame pos = function
-    Frame(atrs,s) ->
-    let schema = Xlist.fold s [] (fun schema p ->
-        let morfs = Xlist.fold p.morfs [] (fun morfs morf ->
-            match pos with
-              "verb" -> simplify_frame_verb morf @ morfs
-            | "noun" -> simplify_frame_noun morf @ morfs
-            | "adj" -> simplify_frame_adj morf @ morfs
-            | "adv" -> simplify_frame_adv morf @ morfs
-            | _ -> failwith "simplify_frame") in
-        if morfs = [] then schema else
-          {p with ce=[]; cr=[]; morfs=morfs} :: schema) in
-    if schema = [] then [] else [Frame(atrs,schema)]
-  | _ -> failwith "simplify_frame: ni"
-
-
-(* Uproszczone schematy *)
-(* let _ =
-  StringMap.iter schemata_walenty (fun pos orth_map ->
-      if pos = "noun" then
-      StringMap.iter orth_map (fun orth frames ->
-          Xlist.iter frames (fun frame ->
-              let frame = insert_phrases ENIAMwalTEI.phrases frame in
-              let frames = simplify_frame pos frame in
-              Xlist.iter frames (fun frame -> print_endline (ENIAMwalStringOf.frame orth frame))))) *)
-
-let has_mode_coordination = function
-    Frame(atrs,s) -> Xlist.fold s false (fun b p ->
-      let n = Xlist.fold p.morfs 0 (fun n -> function
-              MorfId id -> failwith "has_nontrivial_lex"
-            | PhraseAbbr(Advp _,_) -> n+1
-            | PhraseAbbr(Xp _,_) -> n+1
-            (* | LexPhraseMode _ -> n+1 FIXME*)
-            | _ -> n) in
-      if n>1 then true else b)
-  | _ -> failwith "has_nontrivial_lex: ni"
-
-(* Koordynacja z mode *)
-(* let _ =
-  StringMap.iter schemata_walenty(*connected_walenty*) (fun _ orth_map ->
-      StringMap.iter orth_map (fun orth frames ->
-          Xlist.iter frames (fun frame ->
-              let frame = insert_phrases ENIAMwalTEI.phrases frame in
-              if has_mode_coordination frame then
-                print_endline (ENIAMwalStringOf.frame orth frame)))) *)
-
-
-(* let get_entry orth pos *)
-     (*
-let load_walenty2 () =
-  let walenty = load_walenty walenty_filename in
-  Xlist.fold walenty StringMap.empty (fun walenty entry ->
-    if entry.frames = [] then Xlist.fold (connect2 entry) walenty (fun walenty (lemma,pos,frame) ->
-      let map = try StringMap.find walenty pos with Not_found -> StringMap.empty in
-      let map = StringMap.add_inc map lemma [frame] (fun l -> frame :: l) in
-      StringMap.add walenty pos map)
-    else Xlist.fold (connect entry) walenty (fun walenty (lemma,pos,frame) ->
-      let map = try StringMap.find walenty pos with Not_found -> StringMap.empty in
-      let map = StringMap.add_inc map lemma [frame] (fun l -> frame :: l) in
-      StringMap.add walenty pos map))
-
-
-let print_stringqmap filename qmap =
-  let l = StringQMap.fold qmap [] (fun l k v -> (v,k) :: l) in
-  File.file_out filename (fun file ->
-    Xlist.iter (Xlist.sort l compare) (fun (v,k) ->
-      Printf.fprintf file "%5d %s\n" v k))
-
-let sel_prefs_quantities walenty =
-  Xlist.fold walenty StringQMap.empty (fun quant e ->
-    Xlist.fold e.frames quant (fun quant f ->
-      Xlist.fold f.arguments quant (fun quant a ->
-        Xlist.fold a.sel_prefs quant (fun quant l ->
-          Xlist.fold l quant (fun quant -> function
-              Numeric s ->
-                let name = try ENIAMplWordnet.synset_name s with Not_found -> "unknown" in
-                StringQMap.add quant ("N " ^ s ^ " " ^ name)
-            | Symbol s -> StringQMap.add quant ("S " ^ s)
-            | Relation(s,t) -> StringQMap.add quant ("R " ^ s ^ " | " ^ t))))))
-*)
-(*let _ =
-  let walenty = load_walenty walenty_filename in
-  let quant = sel_prefs_quantities walenty in
-  print_stringqmap "results/quant_sel_prefs.txt" quant*)
-
-(*let _ =
-  let walenty = load_walenty2 () in
-  let frames_sem = try StringMap.find (StringMap.find walenty "verb") "bębnić" with Not_found -> failwith "walTEI" in
-  Xlist.iter frames_sem (fun frame ->
-    print_endline (WalStringOf.frame "bębnić" frame))*)
+      let positions = if refl then ENIAMwalTEI.refl_position :: positions else positions in
+      (opinion,schema_atrs,positions) :: found)
@@ -217,35 +217,6 @@ and assign_role_and_sense_morfs morfs =
     | LexPhraseMode(_,pos_lex,(restr,schema)) -> [LexPhrase(pos_lex,(restr,assign_role_and_sense schema))]
     | _ -> failwith "assign_role_and_sense_morfs"))
  
-let rec assign_pro_args schema =
-  Xlist.map schema (fun s ->
-    let morfs = match s.morfs with
-      (E p) :: l -> E Pro :: (E p) :: l
-    | [LexPhrase _] as morfs -> morfs
-    | [Phrase(FixedP _)] as morfs -> morfs
-    | [Phrase(Lex _)] as morfs -> morfs
-(*    | [Phrase Refl] as morfs -> morfs
-    | [Phrase Recip] as morfs -> morfs*)
-    | Phrase Null :: _ as morfs -> morfs
-    | Phrase Pro :: _ as morfs -> morfs
-    | morfs -> if s.gf <> SUBJ && s.cr = [] && s.ce = [] then (Phrase Null) :: morfs else (Phrase Pro) :: morfs in (* FIXME: ustalić czy są inne przypadki uzgodnienia *)
-(*     let morfs = assign_pro_args_lex morfs in *) (* bez pro wewnątrz leksykalizacji *)
-    {s with morfs=morfs})
-
-(*let assign_pro_args_lex morfs =
-  Xlist.map morfs (function
-      Lex(morf,specs,lex,restr) -> LexN(morf,specs,lex,assign_pro_args_restr restr)
-    | LexNum(morf,lex1,lex2,restr) -> LexNum(morf,lex1,lex2,assign_pro_args_restr restr)
-    | LexCompar(morf,l) -> LexCompar(morf,make_gfs_lex l)
-    | morf -> morf)
-
-and assign_pro_args_restr = function
-    Natr -> Natr
-  | Ratr1 schema -> Ratr1(assign_pro_args schema)
-  | Atr1 schema -> Atr1(assign_pro_args schema)
-  | Ratr schema -> Ratr(assign_pro_args schema)
-  | Atr schema -> Atr(assign_pro_args schema)*)
-
 (*let _ =
   Xlist.iter walenty_filenames (fun filename ->
     print_endline filename;
@@ -258,92 +229,6 @@ and assign_pro_args_restr = function
         ignore (process_aspect [Text aspect]);
         ignore (assign_pro_args (make_gfs (process_schema expands subtypes equivs schema))))))*)
  
-exception ImpossibleSchema
-
-let rec reduce_comp lexemes = function
-    Comp s -> if StringMap.mem lexemes s then Comp s else raise Not_found
-  | Zeby -> if StringMap.mem lexemes "żeby" || StringMap.mem lexemes "że" then Zeby else raise Not_found
-  | Gdy -> if StringMap.mem lexemes "gdy" || StringMap.mem lexemes "gdyby" then Gdy else raise Not_found
-  | CompUndef -> failwith "reduce_comp"
-
-let reduce_phrase lexemes = function
-  | PrepNP(_,prep,case) as phrase -> if StringMap.mem lexemes prep then phrase else raise Not_found
-  | PrepAdjP(_,prep,case) as phrase -> if StringMap.mem lexemes prep then phrase else raise Not_found
-  | PrepNumP(_,prep,case) as phrase -> if StringMap.mem lexemes prep then phrase else raise Not_found
-  | ComprepNP(_,prep) as phrase  -> if Xlist.fold (try StringMap.find comprep_reqs prep with Not_found -> []) true (fun b s -> b && StringMap.mem lexemes s) then phrase else raise Not_found
-  | ComparNP(_,prep,case) as phrase  -> if StringMap.mem lexemes prep then phrase else raise Not_found
-  | ComparPP(_,prep) as phrase  -> if StringMap.mem lexemes prep then phrase else raise Not_found
-  | CP(ctype,comp) -> CP(ctype,reduce_comp lexemes comp)
-  | NCP(case,ctype,comp) -> if StringMap.mem lexemes "to" then NCP(case,ctype,reduce_comp lexemes comp) else raise Not_found
-  | PrepNCP(sem,prep,case,ctype,comp) -> if StringMap.mem lexemes prep && StringMap.mem lexemes "to" then PrepNCP(sem,prep,case,ctype,reduce_comp lexemes comp) else raise Not_found
-  | phrase -> phrase
-
-let rec reduce_lex lexemes = function
-    Lexeme s -> if StringMap.mem lexemes s then Lexeme s else raise Not_found
-  | ORconcat l ->
-      let l = List.rev (Xlist.fold l [] (fun l lex -> try reduce_lex lexemes lex :: l with Not_found -> l)) in
-      (match l with
-          [] -> raise Not_found
-        | [x] -> x
-        | l -> ORconcat l)
-  | ORcoord l ->
-      let l = List.rev (Xlist.fold l [] (fun l lex -> try reduce_lex lexemes lex :: l with Not_found -> l)) in
-      (match l with
-          [] -> raise Not_found
-        | [x] -> x
-        | l -> ORcoord l)
-  | XOR l ->
-      let l = List.rev (Xlist.fold l [] (fun l lex -> try reduce_lex lexemes lex :: l with Not_found -> l)) in
-      (match l with
-          [] -> raise Not_found
-        | [x] -> x
-        | l -> XOR l)
-  | Elexeme gender -> Elexeme gender
-
-let rec reduce_restr lexemes = function   (* leksykalizacje wewnątrz leksykalizacji są w niektórych sytuacjach opcjonalne *)
-    Natr,[] -> Natr,[]
-  | Atr,[] -> Atr,[]
-  | Ratr,[] -> Ratr,[]
-  | Atr1,[] -> Atr1,[]
-  | Ratr1,[] -> Ratr1,[]
-  | Ratr1,schema -> let schema = reduce_schema2 lexemes schema in if schema = [] then raise Not_found else Ratr1,schema
-  | Atr1,schema -> let schema = reduce_schema2 lexemes schema in if schema = [] then Natr,[] else Atr1,schema
-  | Ratr,schema -> let schema = reduce_schema2 lexemes schema in if schema = [] then raise Not_found else Ratr,schema
-  | Atr,schema -> let schema = reduce_schema2 lexemes schema in if schema = [] then Natr,[] else Atr,schema
-  | Ratrs,schema -> Ratrs,reduce_schema lexemes schema
-  | _ -> failwith "reduce_restr"
-
-and reduce_morf lexemes = function (* leksykalizacje, które się z czymś koordynują nie są obowiązakowe *)
-    Phrase phrase -> Phrase(reduce_phrase lexemes phrase)
-  | E phrases -> E phrases (* FIXME: uproszczenie *)
-  | LexPhrase(pos_lex,restr) -> LexPhrase(Xlist.map pos_lex (fun (pos,lex) -> pos, reduce_lex lexemes lex),reduce_restr lexemes restr)
-  | morf -> failwith ("reduce_morf: " ^ ENIAMwalStringOf.morf morf)
-
-and reduce_morfs lexemes = function
-    [] -> []
-  | morf :: l -> (try [reduce_morf lexemes morf] with Not_found -> []) @ reduce_morfs lexemes l
-
-and reduce_schema2 lexemes = function
-    [] -> []
-  | s :: l ->
-      let morfs = reduce_morfs lexemes s.morfs in
-      if morfs = [] then reduce_schema2 lexemes l else
-      {s with morfs=morfs} :: reduce_schema2 lexemes l
-
-and reduce_schema lexemes = function
-    [] -> []
-  | s :: l ->
-      let morfs = reduce_morfs lexemes s.morfs in
-      if morfs = [] then raise ImpossibleSchema else
-      {s with morfs=morfs} :: reduce_schema lexemes l
-
-let reduce_schema_frame lexemes = function
-    Frame(atrs,schema) -> Frame(atrs,reduce_schema lexemes schema)
-(*  | ComprepFrame(s,morfs) ->
-      let morfs = reduce_morfs lexemes morfs in
-      if morfs = [] then raise ImpossibleSchema else ComprepFrame(s,morfs)*)
-  | _ -> failwith "reduce_schema_frame"
-
 let remove_trivial_args schema =
   Xlist.fold schema [] (fun l (_,_,_,morfs) ->
     let morfs = Xlist.fold morfs [] (fun morfs -> function
+(*
+ *  ENIAMwalenty, an interface for Polish Valence Dictionary "Walenty".
+ *  Copyright (C) 2016 Wojciech Jaworski <wjaworski atSPAMfree mimuw dot edu dot pl>
+ *  Copyright (C) 2016 Institute of Computer Science Polish Academy of Sciences
+ *
+ *  This library is free software: you can redistribute it and/or modify
+ *  it under the terms of the GNU Lesser General Public License as published by
+ *  the Free Software Foundation, either version 3 of the License, or
+ *  (at your option) any later version.
+ *
+ *  This library is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU Lesser General Public License for more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ *)
+
+open ENIAMwalTypes2
+open Xstd
+
+(* Loads the dictionary from [walenty_filename] and the phrase type
+   realizations from [expands_filename], and returns a 4-tuple:
+   - connected_walenty: results of ENIAMwalConnect.connect for every entry,
+     stored under the entry's form_pos and form_orth;
+   - schemata_walenty: results of ENIAMwalConnect.schemata, stored the same way;
+   - phrases: map from phrase id to the list of morfs obtained after expansion
+     and after lexical entries have been extracted from them;
+   - entries: lexical entries stored under pos and lemma, deduplicated and
+     passed through ENIAMwalLex.expand_restr.
+   Note that the names phrases, entries and expands are rebound several times
+   below, so the order of the bindings matters. *)
+let load_walenty walenty_filename expands_filename =
+  let walenty,phrases = ENIAMwalTEI.load_walenty walenty_filename in
+  let expands = ENIAMwalTEI.load_expands expands_filename in
+  (* Accumulate the connected entries of each dictionary entry under its
+     form_pos / form_orth. *)
+  let connected_walenty =
+    Xlist.fold walenty Entries.empty (fun connected_walenty e ->
+        let entries = ENIAMwalConnect.connect e in
+        Entries.add_inc_list connected_walenty e.form_pos e.form_orth entries) in
+  (* Same accumulation, using the schemata of each dictionary entry. *)
+  let schemata_walenty =
+    Xlist.fold walenty Entries.empty (fun schemata_walenty e ->
+        let entries = ENIAMwalConnect.schemata e in
+        Entries.add_inc_list schemata_walenty e.form_pos e.form_orth entries) in
+  (* From here on expands refers to the value returned by load_realizations,
+     not to the raw value loaded above. *)
+  let expands,compreps,subtypes,equivs =
+    ENIAMwalRealizations.load_realizations (expands,ENIAMwalTEI.subtypes,ENIAMwalTEI.equivs) in
+  (* Expand each phrase in three steps: schema expansion, subtype expansion
+     (which yields a list), then equivalent expansion of every element, with
+     the results flattened. After this step every id maps to a list. *)
+  let phrases =
+    IntMap.map phrases (fun morf ->
+        let morf = ENIAMwalRealizations.expand_schema_morf expands morf in
+        let morfs = ENIAMwalRealizations.expand_subtypes_morf subtypes morf in
+        let morf = List.flatten (Xlist.map morfs (ENIAMwalRealizations.expand_equivs_morf equivs)) in
+        morf) in
+  let compreps = Xlist.map compreps (fun (lemma,morfs) ->
+      lemma, ENIAMwalLex.expand_lexicalizations_morfs morfs) in
+  (* The entry list is seeded with the entries extracted from compreps. *)
+  let entries = ENIAMwalLex.extract_lex_entries_comprepnp [] compreps in
+  (* Rebuild the phrase map while threading the entry list through
+     extract_lex_entries for every morf of every phrase. *)
+  let phrases,entries =
+    IntMap.fold phrases (IntMap.empty,entries) (fun (phrases,entries) id morfs ->
+        let morfs = ENIAMwalLex.expand_lexicalizations_morfs morfs in
+        let morfs,entries = Xlist.fold morfs ([],entries) ENIAMwalLex.extract_lex_entries in
+        IntMap.add phrases id morfs, entries) in
+  (* Group the (pos,lemma,entry) triples by pos and lemma. *)
+  let entries = Xlist.fold entries Entries.empty (fun entries (pos,lemma,entry) ->
+      Entries.add_inc entries pos lemma entry) in
+  (* Remove duplicates by a round trip through EntrySet. *)
+  let entries = Entries.map2 entries (fun pos lemma entries -> EntrySet.to_list (EntrySet.of_list entries)) in
+  let entries = Entries.flatten_map entries (fun pos lemma entry ->
+      ENIAMwalLex.expand_restr [] lemma pos entry) in
+    (* let entries =
+      StringMap.mapi entries (fun pos entries2 ->
+        StringMap.mapi entries2 (fun lemma entries3 ->
+            EntrySet.fold entries3 [] (fun entries3 entry ->
+                (ENIAMwalLex.expand_restr [] lemma pos entry) @ entries3))) in *)
+  connected_walenty, schemata_walenty, phrases, entries
+
+(* Writes every entry of [entries] to the file [filename], one per line, as
+   three tab-separated fields: the pos key, the lemma key and the entry
+   rendered with ENIAMwalStringOf.lex_entry. *)
+let print_entries filename entries =
+  let write_entry out pos lemma entry =
+    let rendered = ENIAMwalStringOf.lex_entry entry in
+    Printf.fprintf out "%s\t%s\t%s\n" pos lemma rendered in
+  File.file_out filename (fun out ->
+      Entries.iter entries (write_entry out))
+
+(* Writes the phrase map [phrases] to the file [filename]: one line per id,
+   holding the id followed by its morfs rendered with ENIAMwalStringOf.morf,
+   all separated by tabs. *)
+let print_phrases filename phrases =
+  let write_phrase out id morfs =
+    let rendered = Xlist.map morfs ENIAMwalStringOf.morf in
+    let joined = String.concat "\t" rendered in
+    Printf.fprintf out "%d\t%s\n" id joined in
+  File.file_out filename (fun out ->
+      IntMap.iter phrases (write_phrase out))
+
+(* Writes [schemata] to the file [filename], one schema per line with seven
+   tab-separated fields: pos, lemma, opinion, negation, predicativity, aspect
+   and the schema itself, each rendered with the matching ENIAMwalStringOf
+   function. *)
+let print_schemata filename schemata =
+  let write_schema out pos lemma (opinion,(negation,pred,aspect),schema) =
+    let opinion_s = ENIAMwalStringOf.opinion opinion in
+    let negation_s = ENIAMwalStringOf.negation negation in
+    let pred_s = ENIAMwalStringOf.pred pred in
+    let aspect_s = ENIAMwalStringOf.aspect aspect in
+    let schema_s = ENIAMwalStringOf.simple_schema schema in
+    Printf.fprintf out "%s\t%s\t%s\t%s\t%s\t%s\t%s\n" pos lemma
+      opinion_s negation_s pred_s aspect_s schema_s in
+  File.file_out filename (fun out ->
+      Entries.iter schemata (write_schema out))
+
+(* Splits [s] on spaces, commas and hyphens and joins the pieces back with
+   single spaces. Spaces are dropped, while commas and hyphens are kept as
+   tokens of their own. *)
+let split_tokens s =
+  let separators = Str.regexp " \\|,\\|-" in
+  let is_kept = function
+      Str.Delim " " -> false
+    | Str.Delim _ | Str.Text _ -> true in
+  let text_of = function
+      Str.Delim t | Str.Text t -> t in
+  Str.full_split separators s
+  |> List.filter is_kept
+  |> List.map text_of
+  |> String.concat " "
+
+(* Writes the string set [fixed] to the file [filename]. Each line holds the
+   tokenized form produced by split_tokens, the original string and the
+   literal tag "fixed", separated by tabs. *)
+let print_fixed filename fixed =
+  let write_line out phrase =
+    let tokenized = split_tokens phrase in
+    Printf.fprintf out "%s\t%s\tfixed\n" tokenized phrase in
+  File.file_out filename (fun out ->
+      StringSet.iter fixed (write_line out))
+
+
+(* Adds to the set [fixed] the string carried by a fixed phrase or by a
+   lexical argument tagged FIXED; any other morf leaves the set unchanged. *)
+let add_fixed fixed morf =
+  match morf with
+  | Phrase (FixedP s)
+  | SimpleLexArg(s,FIXED)
+  | LexArg(_,s,FIXED) -> StringSet.add fixed s
+  | _ -> fixed
+
+(* Extends the set [fixed] with the fixed strings (as recognised by add_fixed)
+   found in the morfs of every position of [schema], and returns the extended
+   set.
+   The set is threaded through both folds. Previously the outer accumulator
+   was ignored and the inner fold restarted from the initial [fixed], so only
+   the last position of the schema contributed to the result. *)
+let find_fixed_schema fixed schema =
+  Xlist.fold schema fixed (fun fixed p ->
+      Xlist.fold p.morfs fixed add_fixed)
+
+(* Collects the set of fixed strings occurring in [phrases] (via add_fixed on
+   every morf) and in [entries]: the string of every entry tagged "fixed",
+   plus whatever find_fixed_schema finds in the schemata of LexEntry and
+   ComprepNPEntry entries. *)
+let find_fixed phrases entries =
+  let from_phrases =
+    IntMap.fold phrases StringSet.empty (fun acc _ morfs ->
+        Xlist.fold morfs acc add_fixed) in
+  (* Adds s to the set only when the entry's tag is "fixed". *)
+  let add_if_fixed acc tag s =
+    if tag = "fixed" then StringSet.add acc s else acc in
+  Entries.fold entries from_phrases (fun acc _ _ entry ->
+      match entry with
+        SimpleLexEntry(s,tag) -> add_if_fixed acc tag s
+      | LexEntry(_,s,tag,_,schema) -> find_fixed_schema (add_if_fixed acc tag s) schema
+      | ComprepNPEntry(_,_,schema) -> find_fixed_schema acc schema)
+
+(* Loads the dictionary once, at module initialisation.
+   The input locations can be overridden with the environment variables
+   WALENTY_FILENAME and WALENTY_EXPANDS_FILENAME; when a variable is unset the
+   original hard-coded path is used, so existing setups behave as before. *)
+let connected_walenty, schemata_walenty, phrases, entries =
+  let path_from_env variable default =
+    try Sys.getenv variable with Not_found -> default in
+  load_walenty
+    (path_from_env "WALENTY_FILENAME"
+       "/home/yacheu/Dokumenty/NLP resources/Walenty/walenty_20170311.xml")
+    (path_from_env "WALENTY_EXPANDS_FILENAME"
+       "/home/yacheu/Dokumenty/NLP resources/Walenty/phrase_types_expand_20170311.xml")
+
+(* FIXME: uporządkowanie "winien" *)
+(* Resource generation: writes the lexical entries, the phrases, the schemata
+   and the fixed expressions to tab-separated files in the results directory. *)
+let () =
+  print_entries "results/entries.tab" entries;
+  print_phrases "results/phrases.tab" phrases;
+  print_schemata "results/schemata.tab" schemata_walenty;
+  (* print_connected "results/connected.dic" connected_walenty); *)
+  let fixed = find_fixed phrases entries in
+  print_fixed "results/fixed.tab" fixed;
+  ()
+
+(* Test wczytywania Walentego TEI *)
+(* let _ =
+   let walenty,phrases = ENIAMwalTEI.load_walenty "/home/yacheu/Dokumenty/NLP resources/Walenty/walenty_20170311.xml"
+   let n = Xlist.fold ENIAMwalTEI.walenty 0 (fun n e -> let l = connect e in n + Xlist.size l) in
+   let m = Xlist.fold ENIAMwalTEI.walenty 0 (fun n e -> let l = schemata e in n + Xlist.size l) in
+   Printf.printf "%d connected\n%d schemata\n|phrases|=%d\n" n m (IntMap.size phrases);
+   () *)
+
+(* let insert_phrases phrases = function
+    Frame(atrs,s) -> Frame(atrs,Xlist.map s (fun p ->
+      {p with morfs=Xlist.map p.morfs (function
+             MorfId id -> (try IntMap.find phrases id with Not_found -> failwith "insert_phrases")
+           | _ -> failwith "insert_phrases")}))
+  | _ -> failwith "insert_phrases: ni"
+
+let print_entry pos_map pos orth =
+  let orth_map = try StringMap.find pos_map pos with Not_found -> StringMap.empty in
+  let frames = try StringMap.find orth_map orth with Not_found -> [] in
+  Xlist.iter frames (fun frame ->
+      let frame = insert_phrases ENIAMwalTEI.phrases frame in
+      print_endline (ENIAMwalStringOf.frame orth frame)) *)
+
+(* Wypisanie hasła *)
+(* let _ =
+   print_entry connected_walenty "verb" "brudzić";
+   () *)
+
+(* let has_nontrivial_lex = function
+    Frame(atrs,s) -> Xlist.fold s false (fun b p ->
+      if p.role = "Lemma" && p.role_attr = "" then b else
+        Xlist.fold p.morfs b (fun b -> function
+              MorfId id -> failwith "has_nontrivial_lex"
+            | LexPhrase _ -> true
+            (* | LexRPhrase _ -> true
+               | LexPhraseMode _ -> true *)
+            | _ -> b))
+  | _ -> failwith "has_nontrivial_lex: ni" *)
+
+(* Leksykalizacje nie wchodzące do lematu *)
+(* let _ =
+   StringMap.iter connected_walenty (fun _ orth_map ->
+      StringMap.iter orth_map (fun orth frames ->
+          Xlist.iter frames (fun frame ->
+              let frame = insert_phrases ENIAMwalTEI.phrases frame in
+              if has_nontrivial_lex frame then
+                print_endline (ENIAMwalStringOf.frame orth frame)))) *)
+
+(* Verb variant of the simplification: returns [] for dative and instrumental
+   NPs, PrepNP, ComprepNP and AdvP phrases, and the morf itself as a singleton
+   list otherwise. *)
+let simplify_frame_verb morf =
+  match morf with
+  | Phrase(NP(Case "dat"))
+  | Phrase(NP(Case "inst"))
+  | Phrase(PrepNP _)
+  | Phrase(ComprepNP _)
+  | Phrase(AdvP) -> []
+  | _ -> [morf]
+
+(* Noun variant of the simplification: returns [] for the listed NP, PrepNP,
+   ComprepNP, AdjP, Ncp, Prepncp and Possp patterns, and the morf itself as a
+   singleton list otherwise. *)
+let simplify_frame_noun morf =
+  match morf with
+  | Phrase(NP(Case "gen"))
+  | Phrase(NP(Case "nom"))
+  | Phrase(NP(CaseAgr))
+  | Phrase(PrepNP _)
+  | Phrase(ComprepNP _)
+  | Phrase(AdjP CaseAgr)
+  | PhraseComp(Ncp(Case "gen"),_)
+  | PhraseComp(Prepncp(_,_),_)
+  | PhraseAbbr(Possp,[]) -> []
+  | _ -> [morf]
+
+(* Adjective variant of the simplification: nothing is removed, the morf is
+   returned as a singleton list. *)
+let simplify_frame_adj morf = [morf]
+
+(* Adverb variant of the simplification: nothing is removed, the morf is
+   returned as a singleton list. *)
+let simplify_frame_adv morf = [morf]
+
+
+(* let simplify_frame pos = function
+    Frame(atrs,s) ->
+    let schema = Xlist.fold s [] (fun schema p ->
+        let morfs = Xlist.fold p.morfs [] (fun morfs morf ->
+            match pos with
+              "verb" -> simplify_frame_verb morf @ morfs
+            | "noun" -> simplify_frame_noun morf @ morfs
+            | "adj" -> simplify_frame_adj morf @ morfs
+            | "adv" -> simplify_frame_adv morf @ morfs
+            | _ -> failwith "simplify_frame") in
+        if morfs = [] then schema else
+          {p with ce=[]; cr=[]; morfs=morfs} :: schema) in
+    if schema = [] then [] else [Frame(atrs,schema)]
+  | _ -> failwith "simplify_frame: ni" *)
+
+
+(* Uproszczone schematy *)
+(* let _ =
+   StringMap.iter schemata_walenty (fun pos orth_map ->
+      if pos = "noun" then
+      StringMap.iter orth_map (fun orth frames ->
+          Xlist.iter frames (fun frame ->
+              let frame = insert_phrases ENIAMwalTEI.phrases frame in
+              let frames = simplify_frame pos frame in
+              Xlist.iter frames (fun frame -> print_endline (ENIAMwalStringOf.frame orth frame))))) *)
+
+(* let has_mode_coordination = function
+    Frame(atrs,s) -> Xlist.fold s false (fun b p ->
+      let n = Xlist.fold p.morfs 0 (fun n -> function
+            MorfId id -> failwith "has_nontrivial_lex"
+          | PhraseAbbr(Advp _,_) -> n+1
+          | PhraseAbbr(Xp _,_) -> n+1
+          (* | LexPhraseMode _ -> n+1 FIXME*)
+          | _ -> n) in
+      if n>1 then true else b)
+  | _ -> failwith "has_nontrivial_lex: ni" *)
+
+(* Koordynacja z mode *)
+(* let _ =
+   StringMap.iter schemata_walenty(*connected_walenty*) (fun _ orth_map ->
+      StringMap.iter orth_map (fun orth frames ->
+          Xlist.iter frames (fun frame ->
+              let frame = insert_phrases ENIAMwalTEI.phrases frame in
+              if has_mode_coordination frame then
+                print_endline (ENIAMwalStringOf.frame orth frame)))) *)
+
+
+(* let get_entry orth pos *)
+     (*
+let load_walenty2 () =
+  let walenty = load_walenty walenty_filename in
+  Xlist.fold walenty StringMap.empty (fun walenty entry ->
+    if entry.frames = [] then Xlist.fold (connect2 entry) walenty (fun walenty (lemma,pos,frame) ->
+      let map = try StringMap.find walenty pos with Not_found -> StringMap.empty in
+      let map = StringMap.add_inc map lemma [frame] (fun l -> frame :: l) in
+      StringMap.add walenty pos map)
+    else Xlist.fold (connect entry) walenty (fun walenty (lemma,pos,frame) ->
+      let map = try StringMap.find walenty pos with Not_found -> StringMap.empty in
+      let map = StringMap.add_inc map lemma [frame] (fun l -> frame :: l) in
+      StringMap.add walenty pos map))
+
+
+let print_stringqmap filename qmap =
+  let l = StringQMap.fold qmap [] (fun l k v -> (v,k) :: l) in
+  File.file_out filename (fun file ->
+    Xlist.iter (Xlist.sort l compare) (fun (v,k) ->
+      Printf.fprintf file "%5d %s\n" v k))
+
+let sel_prefs_quantities walenty =
+  Xlist.fold walenty StringQMap.empty (fun quant e ->
+    Xlist.fold e.frames quant (fun quant f ->
+      Xlist.fold f.arguments quant (fun quant a ->
+        Xlist.fold a.sel_prefs quant (fun quant l ->
+          Xlist.fold l quant (fun quant -> function
+              Numeric s ->
+                let name = try ENIAMplWordnet.synset_name s with Not_found -> "unknown" in
+                StringQMap.add quant ("N " ^ s ^ " " ^ name)
+            | Symbol s -> StringQMap.add quant ("S " ^ s)
+            | Relation(s,t) -> StringQMap.add quant ("R " ^ s ^ " | " ^ t))))))
+*)
+(*let _ =
+  let walenty = load_walenty walenty_filename in
+  let quant = sel_prefs_quantities walenty in
+  print_stringqmap "results/quant_sel_prefs.txt" quant*)
+
+(*let _ =
+  let walenty = load_walenty2 () in
+  let frames_sem = try StringMap.find (StringMap.find walenty "verb") "bębnić" with Not_found -> failwith "walTEI" in
+  Xlist.iter frames_sem (fun frame ->
+    print_endline (WalStringOf.frame "bębnić" frame))*)
+
+
+(* Wypisanie realizacji *)
+(* let _ =
+   Xlist.iter ENIAMwalTEI.expands (fun (id,morf,l) ->
+      Printf.printf "%d %s:\n" id (ENIAMwalStringOf.morf morf);
+      Xlist.iter l (fun morf -> Printf.printf "    %s\n" (ENIAMwalStringOf.morf morf))) *)
+
+(* Wypisanie realizacji po przetworzeniu *)
+(* let _ =
+   AbbrMap.iter expands (fun morf l ->
+      Printf.printf "%s:\n" (ENIAMwalStringOf.phrase_abbr morf);
+      Xlist.iter l (fun morf -> Printf.printf "    %s\n" (ENIAMwalStringOf.morf morf))) *)
+
+(* True exactly for morfs built with PhraseAbbr or PhraseComp. *)
+let has_realization morf =
+  match morf with
+  | PhraseAbbr _ | PhraseComp _ -> true
+  | _ -> false
+
+(* Wypisanie fraz, które podlegają rozwijaniu *)
+(*let _ =
+  IntMap.iter ENIAMwalTEI.phrases (fun i morf ->
+      if has_realization morf then
+      Printf.printf "%4d %s\n" i (ENIAMwalStringOf.morf morf)) *)
+
+(* Wypisanie fraz, które podlegają rozwijaniu *)
+(* let _ =
+   IntMap.iter phrases (fun i morf ->
+      if has_realization morf then
+      Printf.printf "%4d %s\n" i (ENIAMwalStringOf.morf morf)) *)
+
+(* let test_phrases = [17088; 17133; 1642]
+   let _ =
+   Xlist.iter test_phrases (fun i ->
+      let m1 = IntMap.find ENIAMwalTEI.phrases i in
+      let m2 = IntMap.find phrases i in
+      Printf.printf "%4d %s\n" i (ENIAMwalStringOf.morf m1);
+      Printf.printf "%4d %s\n" i (ENIAMwalStringOf.morf m2)) *)
+
+(* let print_entries entries =
+  StringMap.iter entries (fun pos entries2 ->
+      StringMap.iter entries2 (fun lemma entries3 ->
+          EntrySet.iter entries3 (fun entry ->
+              Printf.printf "%s: %s: %s\n" pos lemma (ENIAMwalStringOf.entry entry)))) *)
+
+(* let _ = print_entries entries *)
@@ -17,7 +17,7 @@
  *  along with this program.  If not, see <http://www.gnu.org/licenses/>.
  *)
  
-open ENIAMwalTypes
+open ENIAMwalTypes2
 open Xstd
  
 let prep_arg_schema_field morfs =
@@ -63,7 +63,8 @@ and expand_lexicalizations_morfs morfs = (* uproszczenie polegające na zezwolen
       (*      | LexPhrase([PREP _,_;ADJ _,_],(_,_::_)) -> print_endline (ENIAMwalStringOf.morf morf); [morf]
               | LexPhrase([PREP _,_;PPAS _,_],(_,_::_)) -> print_endline (ENIAMwalStringOf.morf morf); [morf]
               | LexPhrase([PREP _,_;PACT _,_],(_,_::_)) -> print_endline (ENIAMwalStringOf.morf morf); [morf] *)
-      | Phrase(PrepNumP(prep,case)) -> [LexPhrase([PREP case,Lexeme prep],(Ratrs,[prep_arg_schema_field(*2*) [Phrase(NumP(case))]]))]
+      (* | Phrase(PrepNumP(prep,case)) -> [LexPhrase([PREP case,Lexeme prep],(Ratrs,[prep_arg_schema_field(*2*) [Phrase(NumP(case))]]))] *)
+      | Phrase(PrepNumP(prep,case)) -> [Phrase(PrepNP(prep,case))] (* FIXME: celowe uproszczenie *)
       | LexPhrase([PREP pcase,plex;SUBST(n,c),slex],(Atr1,[{morfs=[LexPhrase([QUB,_],_)]} as s])) ->
         (*            print_endline (ENIAMwalStringOf.morf morf);  *)
         [LexPhrase([PREP pcase,plex],(Ratrs,[prep_arg_schema_field [LexPhrase([SUBST(n,c),slex],(Natr,[]))]]));
@@ -80,13 +81,13 @@ and expand_lexicalizations_morfs morfs = (* uproszczenie polegające na zezwolen
       | LexPhrase([PREP pcase,plex;NUM(c,g,a),nlex;pos,lex],restr) ->
         let genders,lexs = split_elexeme lex in
         Xlist.map genders (fun gender ->
-            LexPhrase([PREP pcase,plex],(Ratrs,[prep_arg_schema_field [LexPhrase([NUM(c,gender,a),nlex],(Ratrs,[(*num*)prep_arg_schema_field [Phrase Pro]]))]]))) @
+            LexPhrase([PREP pcase,plex],(Ratrs,[prep_arg_schema_field [LexPhrase([NUM(c,gender,a),nlex],(Ratrs,[(*num*)prep_arg_schema_field [Phrase Null(*Pro*)]]))]]))) @ (*FIXME*)
         Xlist.map lexs (fun lex ->
             LexPhrase([PREP pcase,plex],(Ratrs,[prep_arg_schema_field [LexPhrase([NUM(c,g,a),nlex],(Ratrs,[(*num*)prep_arg_schema_field [LexPhrase([pos,lex],restr)]]))]])))
       | LexPhrase([NUM(c,g,a),nlex;pos,lex],restr) ->
         let genders,lexs = split_elexeme lex in
         Xlist.map genders (fun gender ->
-            LexPhrase([NUM(c,gender,a),nlex],(Ratrs,[(*num*)prep_arg_schema_field [Phrase Pro]]))) @
+            LexPhrase([NUM(c,gender,a),nlex],(Ratrs,[(*num*)prep_arg_schema_field [Phrase Null(*Pro*)]]))) @
         Xlist.map lexs (fun lex ->
             LexPhrase([NUM(c,g,a),nlex],(Ratrs,[(*num*)prep_arg_schema_field [LexPhrase([pos,lex],restr)]])))
       | LexPhrase([COMP ctype,clex;pos,lex],restr) ->
@@ -157,6 +158,20 @@ let get_pos lex = function
   | COMPAR -> ["compar"]
   | COMP _ -> ["comp"]
   | FIXED -> ["fixed"]
+  | _ -> failwith "get_pos"
+
+let map_pos lemma = function (* Refines a part of speech using the lemma.
+     Only SUBST is rewritten; every other pos is returned unchanged by the
+     last arm.  For SUBST the lemma decides the result: ja, my, ty and wy
+     give PPRON12, on gives PPRON3 (both keep number and case), siebie
+     gives SIEBIE (case only, the number is dropped), się gives QUB
+     (number and case are dropped); any other lemma keeps the SUBST. *)
+    SUBST(number,case) ->
+    (match lemma with
+       "ja" -> PPRON12(number,case)
+     | "my" -> PPRON12(number,case)
+     | "ty" -> PPRON12(number,case)
+     | "wy" -> PPRON12(number,case)
+     | "on" -> PPRON3(number,case)
+     | "siebie" -> SIEBIE case
+     | "się" -> QUB
+     | _ -> SUBST(number,case))
+  | p -> p
  
 let lex_id_counter = ref 0 (* mutable integer cell starting at 0; presumably the state behind get_lex_id, whose body is not visible here -- confirm *)
  
@@ -166,16 +181,20 @@ let get_lex_id () =
  
 (* FIXME: to trzeba będzie poprawić przy unlike coordination *)
 (* FIXME: słownik pos wywołuje redundancję *)
+(* FIXME: parametr refl z typu pos można przenieść do schematu *)
 let rec extract_lex_entries (morfs,entries) = function
     LexPhrase([pos,lex],(Natr,[])) ->
     let lexemes = get_lexemes lex in
     let entries = Xlist.fold lexemes entries (fun entries lemma ->
         Xlist.fold (get_pos lemma pos) entries (fun entries pos2 ->
+            (pos2,lemma,SimpleLexEntry(lemma,pos2)) :: entries)) in
+            (* let entries = Xlist.fold lexemes entries (fun entries lemma ->
+        Xlist.fold (get_pos lemma pos) entries (fun entries pos2 ->
             let entries2 = try StringMap.find entries pos2 with Not_found -> StringMap.empty in
             let entry = SimpleLexEntry(lemma,pos2) in
             let entries2 = StringMap.add_inc entries2 lemma (EntrySet.singleton entry) (fun set -> EntrySet.add set entry) in
-            StringMap.add entries pos2 entries2)) in
-    let morfs = Xlist.fold lexemes morfs (fun morfs lemma -> SimpleLexArg(lemma,pos) :: morfs) in
+            StringMap.add entries pos2 entries2)) in *)
+    let morfs = Xlist.fold lexemes morfs (fun morfs lemma -> SimpleLexArg(lemma,map_pos lemma pos) :: morfs) in
     morfs,entries
   | LexPhrase([pos,lex],(restr,schema)) ->
     let id = get_lex_id () in
@@ -183,11 +202,14 @@ let rec extract_lex_entries (morfs,entries) = function
     let schema,entries = extract_lex_entries_schema entries schema in
     let entries = Xlist.fold lexemes entries (fun entries lemma ->
         Xlist.fold (get_pos lemma pos) entries (fun entries pos2 ->
+            (pos2,lemma,LexEntry(id,lemma,pos2,restr,schema)) :: entries)) in
+    (* let entries = Xlist.fold lexemes entries (fun entries lemma ->
+        Xlist.fold (get_pos lemma pos) entries (fun entries pos2 ->
             let entries2 = try StringMap.find entries pos2 with Not_found -> StringMap.empty in
             let entry = LexEntry(id,lemma,pos2,restr,schema) in
             let entries2 = StringMap.add_inc entries2 lemma (EntrySet.singleton entry) (fun set -> EntrySet.add set entry) in
-            StringMap.add entries pos2 entries2)) in
-    let morfs = Xlist.fold lexemes morfs (fun morfs lemma -> LexArg(id,lemma,pos) :: morfs) in
+            StringMap.add entries pos2 entries2)) in *)
+    let morfs = Xlist.fold lexemes morfs (fun morfs lemma -> LexArg(id,lemma,map_pos lemma pos) :: morfs) in
     morfs,entries
   | LexPhrase _ as morf -> failwith ("extract_lex_entries: " ^ ENIAMwalStringOf.morf morf)
   | morf -> morf :: morfs, entries
@@ -207,35 +229,21 @@ let extract_lex_entries_comprepnp entries compreps =
             let schema,entries = extract_lex_entries_schema entries schema in
             Xlist.fold lexemes entries (fun entries lemma ->
                 Xlist.fold (get_pos lemma pos) entries (fun entries pos2 ->
+                    (pos2,lemma,ComprepNPEntry(clemma,restr,schema)) :: entries))
+            (* Xlist.fold lexemes entries (fun entries lemma ->
+                Xlist.fold (get_pos lemma pos) entries (fun entries pos2 ->
                     let entries2 = try StringMap.find entries pos2 with Not_found -> StringMap.empty in
                     let entry = ComprepNPEntry(clemma,restr,schema) in
                     let entries2 = StringMap.add_inc entries2 lemma (EntrySet.singleton entry) (fun set -> EntrySet.add set entry) in
-                    StringMap.add entries pos2 entries2))
+                    StringMap.add entries pos2 entries2)) *)
           | _ -> failwith "extract_lex_entries_comprepnp"))
  
-let phrases,entries =
-  let compreps = Xlist.map ENIAMwalRealizations.compreps (fun (lemma,morfs) ->
-      lemma, expand_lexicalizations_morfs morfs) in
-  let entries = extract_lex_entries_comprepnp StringMap.empty compreps in
-  IntMap.fold ENIAMwalRealizations.phrases (IntMap.empty,entries) (fun (phrases,entries) id morfs ->
-      let morfs = expand_lexicalizations_morfs morfs in
-      let morfs,entries = Xlist.fold morfs ([],entries) extract_lex_entries in
-      IntMap.add phrases id morfs, entries)
-
-let print_entries entries =
-  StringMap.iter entries (fun pos entries2 ->
-      StringMap.iter entries2 (fun lemma entries3 ->
-          EntrySet.iter entries3 (fun entry ->
-              Printf.printf "%s: %s: %s\n" pos lemma (ENIAMwalStringOf.entry entry))))
-
-(* let _ = print_entries entries *)
-
 let rec expand_restr valence lexeme pos = function
     SimpleLexEntry(lemma,pos2) -> [SimpleLexEntry(lemma,pos2)]
   (* | LexEntry(id,lemma,pos2,Natr,[]) -> [LexEntry(id,lemma,pos2,NoRestr,[])] *)
   | LexEntry(id,lemma,pos2,Natr,_) -> failwith "expand_restr"
   | LexEntry(id,lemma,pos2,restr,[]) ->
-    print_endline (lexeme ^ " " ^ pos);
+    (* print_endline (lexeme ^ " " ^ pos); *)
     [LexEntry(id,lemma,pos2,restr,[])] (* FIXME *)
 (*    (*       print_endline "expand_restr"; *)
     let frames = try StringMap.find (StringMap.find valence lexeme) pos
@@ -265,7 +273,7 @@ let rec expand_restr valence lexeme pos = function
   | LexEntry(id,lemma,pos2,NoRestr,_) -> failwith "expand_restr"
   (* | ComprepNPEntry(lemma,Natr,[]) -> [ComprepNPEntry(lemma,NoRestr,[])] *)
   | ComprepNPEntry(lemma,Natr,_) -> failwith "expand_restr"
-  | ComprepNPEntry(lemma,restr,[]) as entry -> failwith ("expand_restr: " ^ ENIAMwalStringOf.entry entry)
+  | ComprepNPEntry(lemma,restr,[]) as entry -> failwith ("expand_restr: " ^ ENIAMwalStringOf.lex_entry entry)
   | ComprepNPEntry(lemma,Atr,schema) ->
     let schema = Xlist.map schema (fun p -> {p with morfs=Phrase Null :: p.morfs}) in
     [ComprepNPEntry(lemma,NoRestr,schema)]
@@ -279,35 +287,4 @@ let rec expand_restr valence lexeme pos = function
     Xlist.map schema (fun x -> ComprepNPEntry(lemma,NoRestr,[x]))
   | ComprepNPEntry(lemma,Ratrs,schema) -> [ComprepNPEntry(lemma,NoRestr,schema)]
   | ComprepNPEntry(lemma,NoRestr,_) -> failwith "expand_restr"
-  (* | Frame _ as frame -> [frame] *)
-  | _ -> failwith "expand_restr"
-
-let entries =
-  StringMap.mapi entries (fun pos entries2 ->
-      StringMap.mapi entries2 (fun lemma entries3 ->
-          EntrySet.fold entries3 [] (fun entries3 entry ->
-              (expand_restr [] lemma pos entry) @ entries3)))
-
-
-(*
-let convert morfs =
-  let morfs = expand_lexicalizations_morfs morfs in
-  let morfs,frames = Xlist.fold morfs ([],[]) extract_lex_morf in
-  (*Xlist.fold frames(*extract_lex_frames lexeme pos [] frame*) valence (fun valence -> function
-        lexeme,pos,Frame(atrs,schema) ->
-        let schemas = simplify_lex (split_xor (split_or_coord schema)) in
-        Xlist.fold schemas valence (fun valence schema ->
-            let poss = try StringMap.find valence lexeme with Not_found -> StringMap.empty in
-            let poss = StringMap.add_inc poss pos [Frame(atrs,schema)] (fun l -> Frame(atrs,schema) :: l) in
-            StringMap.add valence lexeme poss)
-      | lexeme,pos,LexFrame(id,pos2,restr,schema) ->
-        let schemas = simplify_lex (split_xor (split_or_coord schema)) in
-        Xlist.fold schemas valence (fun valence schema ->
-            let poss = try StringMap.find valence lexeme with Not_found -> StringMap.empty in
-            let poss = StringMap.add_inc poss pos [LexFrame(id,pos2,restr,schema)] (fun l -> LexFrame(id,pos2,restr,schema) :: l) in
-            StringMap.add valence lexeme poss)
-      | _ -> failwith "convert_frame") *)()
-
-
-let phrases = IntMap.map ENIAMwalRealizations.phrases convert
-*)
+  (* | _ -> failwith "expand_restr" *)
@@ -18,9 +18,16 @@
  *)
  
 open ENIAMwalTypes
-
 open Xstd
  
+type token = (* Tokens of the bracketed textual notation tokenized by split_text. *)
+    Text of string (* a piece of text lying between delimiters *)
+  | Paren of token list (* nested group; string_of_token prints it between round parentheses *)
+  | Bracet of token list (* nested group; string_of_token prints it between curly braces *)
+  | SqBra of token list (* nested group; string_of_token prints it between square brackets *)
+  | LParen | RParen | LBracet | RBracet | LSqBra | RSqBra (* single bracket characters, as emitted by split_text before find_brackets is applied *)
+  | Semic | Plus | Comma | Quot (* the separators semicolon, plus, comma and apostrophe *)
+
 let rec find_brackets = function
     LParen :: l ->
         let found,l = find_rbracket RParen [] l in
@@ -50,6 +57,21 @@ and find_rbracket bracket rev = function
   | s :: l -> find_rbracket bracket (s :: rev) l
   | [] -> failwith "find_rbracket"
  
+let split_text schema = (* Tokenizes the string [schema].  Str.full_split cuts
+     it at every square bracket, curly brace, round parenthesis, plus, comma,
+     semicolon and apostrophe, returning the delimiters as well as the text
+     between them.  Each piece is mapped to the corresponding token and the
+     resulting list is handed to find_brackets.
+     NOTE(review): the catch-all arm raises Failure with the text parse_text,
+     which is not the name of this function; it can only be reached by a
+     delimiter that the regexp matches but no arm lists. *)
+  find_brackets (Xlist.map (Str.full_split (Str.regexp "\\]\\|\\+\\|{\\|}\\|(\\|)\\|,\\|;\\|'\\|\\[") schema) (function
+      Str.Text s -> Text s
+    | Str.Delim "(" -> LParen
+    | Str.Delim ")" -> RParen
+    | Str.Delim "{" -> LBracet
+    | Str.Delim "}" -> RBracet
+    | Str.Delim "[" -> LSqBra
+    | Str.Delim "]" -> RSqBra
+    | Str.Delim ";" -> Semic
+    | Str.Delim "+" -> Plus
+    | Str.Delim "," -> Comma
+    | Str.Delim "'" -> Quot
+    | _ -> failwith "parse_text"))
+
 let rec split_symbol symb rev = function
     [] -> [List.rev rev](*failwith "split_symbol"*)
   | s :: l ->
@@ -58,56 +80,24 @@ let rec split_symbol symb rev = function
         else (List.rev rev) :: (split_symbol symb [] l)
       else split_symbol symb (s :: rev) l
  
-let parse_opinion = function
-    "pewny" -> Pewny
-  | "cer" -> Pewny
-  | "potoczny" -> Potoczny
-  | "col" -> Potoczny
-  | "wątpliwy" -> Watpliwy
-  | "unc" -> Watpliwy
-  | "archaiczny" -> Archaiczny
-  | "dat" -> Archaiczny
-  | "zły" -> Zly
-  | "bad" -> Zly
-  | "wulgarny" -> Wulgarny
-  | "vul" -> Wulgarny
-  | x -> failwith ("parse_opinion: " ^ x)
-
-let parse_roles l =
-  let r,cr,ce = Xlist.fold l ([],[],[]) (fun (r,controller,controllee) -> function
-      "subj" -> SUBJ :: r, controller, controllee
-    | "obj" -> OBJ :: r, controller, controllee
-    | "controller" -> r, "1" :: controller, controllee
-    | "controllee" -> r, controller, "1" :: controllee
-    | "controller2" -> r, "2" :: controller, controllee
-    | "controllee2" -> r, controller, "2" :: controllee
-    | "" -> r, controller, controllee
-    | x -> failwith ("parse_roles: " ^ x)) in
-  (match r with
-    [] -> ARG
-  | [x] -> x
-  | _ -> failwith "parse_roles"),cr,ce
-
-let parse_negation = function
-    [Text "_"] -> NegationUndef
-  | [Text "neg"] -> Negation
-  | [Text "aff"] -> Aff
-  | [Text ""] -> NegationNA
-  | l -> failwith ("parse_negation: " ^ ENIAMwalStringOf.token_list l)
-
-let parse_pred = function
-    [Text ""] -> PredNA
-  | [Text "pred"] -> Pred
-  | [Text "false"] -> PredNA
-  | [Text "true"] -> Pred
-  | l -> failwith ("parse_pred: " ^ ENIAMwalStringOf.token_list l)
-
-let parse_aspect = function
-      [Text "perf"] -> Aspect "perf"
-    | [Text "imperf"] -> Aspect "imperf"
-    | [Text "_"] -> AspectUndef
-    | [Text ""] -> AspectNA
-    | l -> failwith ("parse_aspect: " ^ ENIAMwalStringOf.token_list l)
+let rec string_of_token = function (* Renders one token as text.  Text yields
+     its own string; Paren, Bracet and SqBra yield their elements rendered
+     recursively, concatenated without a separator and wrapped in the
+     matching pair of brackets; every remaining token yields its
+     one-character symbol. *)
+    Text s -> s
+  | Paren l -> "(" ^ String.concat "" (Xlist.map l string_of_token) ^ ")"
+  | Bracet l -> "{" ^ String.concat "" (Xlist.map l string_of_token) ^ "}"
+  | SqBra l -> "[" ^ String.concat "" (Xlist.map l string_of_token) ^ "]"
+  | LParen -> "("
+  | RParen -> ")"
+  | LBracet -> "{"
+  | RBracet -> "}"
+  | LSqBra -> "["
+  | RSqBra -> "]"
+  | Semic -> ";"
+  | Plus -> "+"
+  | Comma -> ","
+  | Quot  -> "'"
+
+let string_of_token_list l = (* Renders every token of [l] with string_of_token and joins the results without a separator; used below to build error messages. *)
+  String.concat "" (Xlist.map l string_of_token)
  
 let parse_case = function
       [Text "nom"] -> Case "nom"
@@ -121,169 +111,15 @@ let parse_case = function
     | [Text "part"] -> Part
     | [Text "postp"] -> Case "postp"
     | [Text "agr"] -> CaseAgr
-    | l -> failwith ("parse_case: " ^ ENIAMwalStringOf.token_list l)
-
-let parse_prep = function
-    | [Text "niż"] -> "niż"
-    | [Text "w czasie"] -> "w czasie"
-    | [Text "podczas"] -> "podczas"
-    | [Text "w roli"] -> "w roli"
-    | [Text "pomiędzy"] -> "pomiędzy"
-    | [Text "według"] -> "według"
-    | [Text "zza"] -> "zza"
-    | [Text "poza"] -> "poza"
-    | [Text "spośród"] -> "spośród"
-    | [Text "spod"] -> "spod"
-    | [Text "koło"] -> "koło"
-    | [Text "względem"] -> "względem"
-    | [Text "wśród"] -> "wśród"
-    | [Text "wskutek"] -> "wskutek"
-    | [Text "przez"] -> "przez"
-    | [Text "co do"] -> "co do"
-    | [Text "wokół"] -> "wokół"
-    | [Text "między"] -> "między"
-    | [Text "bez"] -> "bez"
-    | [Text "przy"] -> "przy"
-    | [Text "na rzecz"] -> "na rzecz"
-    | [Text "na temat"] -> "na temat"
-    | [Text "po"] -> "po"
-    | [Text "u"] -> "u"
-    | [Text "pod"] -> "pod"
-    | [Text "ponad"] -> "ponad"
-    | [Text "jako"] -> "jako"
-    | [Text "w kwestii"] -> "w kwestii"
-    | [Text "w sprawie"] -> "w sprawie"
-    | [Text "ku"] -> "ku"
-    | [Text "przeciw"] -> "przeciw"
-    | [Text "nad"] -> "nad"
-    | [Text "z powodu"] -> "z powodu"
-    | [Text "przed"] -> "przed"
-    | [Text "od"] -> "od"
-    | [Text "o"] -> "o"
-    | [Text "w"] -> "w"
-    | [Text "za"] -> "za"
-    | [Text "dla"] -> "dla"
-    | [Text "na"] -> "na"
-    | [Text "z"] -> "z"
-    | [Text "do"] ->  "do"
-    | [Text "wobec"] -> "wobec"
-    | [Text "jak"] -> "jak"
-    | [Text "spomiędzy"] -> "spomiędzy"
-    | [Text "sponad"] -> "sponad"
-    | [Text "spopod"] -> "spopod"
-    | [Text "spoza"] -> "spoza"
-    | [Text "sprzed"] -> "sprzed"
-    | [Text "znad"] -> "znad"
-    | [Text "dokoła"] -> "dokoła"
-    | [Text "dookoła"] -> "dookoła"
-    | [Text "naokoło"] -> "naokoło"
-    | [Text "naprzeciw"] -> "naprzeciw"
-    | [Text "obok"] -> "obok"
-    | [Text "poniżej"] -> "poniżej"
-    | [Text "popod"] -> "popod"
-    | [Text "pośrodku"] -> "pośrodku"
-    | [Text "pośród"] -> "pośród"
-    | [Text "powyżej"] -> "powyżej"
-    | [Text "wewnątrz"] -> "wewnątrz"
-    | [Text "wkoło"] -> "wkoło"
-    | [Text "wzdłuż"] -> "wzdłuż"
-    | [Text "naokół"] -> "naokół"
-    | [Text "śród"] -> "śród"
-    | [Text "wpośród"] -> "wpośród"
-    | [Text "poprzez"] -> "poprzez"
-    | [Text "około"] -> "około"
-    | [Text "na punkcie"] -> "na punkcie"
-    | [Text "pod względem"] -> "pod względem"
-    | [Text "pod wpływem"] -> "pod wpływem"
-    | [Text "na skutek"] -> "na skutek"
-    | [Text "na polu"] -> "na polu"
-    | [Text "na poczet"] -> "na poczet"
-    | [Text "na widok"] -> "na widok"
-    | [Text "w dziedzinie"] -> "w dziedzinie"
-    | [Text "pod pozorem"] -> "pod pozorem"
-    | [Text "pod pretekstem"] -> "pod pretekstem"
-    | [Text "za pomocą"] -> "za pomocą"
-    | [Text "pod adresem"] -> "pod adresem"
-    | [Text "w kierunku"] -> "w kierunku"
-    | [Text "w stronę"] -> "w stronę"
-    | [Text "w obliczu"] -> "w obliczu"
-    | [Text "u podstaw"] -> "u podstaw"
-    | [Text "pod kątem"] -> "pod kątem"
-    | [Text "na okoliczność"] -> "na okoliczność"
-    | [Text "w temacie"] -> "w temacie"
-    | [Text "od strony"] -> "od strony"
-    | [Text "ze strony"] -> "ze strony"
-    | [Text "po stronie"] -> "po stronie"
-    | [Text "na myśl"] -> "na myśl"
-    | [Text "w charakterze"] -> "w charakterze"
-    | [Text "w zakresie"] -> "w zakresie"
-    | [Text "ze względu na"] -> "ze względu na"
-    | [Text "na podstawie"] -> "na podstawie"
-    | [Text "w stosunku do"] -> "w stosunku do"
-    | [Text "z tytułu"] -> "z tytułu"
-    | [Text "z okazji"] -> "z okazji"
-    | [Text "z zakresu"] -> "z zakresu"
-    | [Text "w wysokości"] -> "w wysokości"
-    | [Text "na gruncie"] -> "na gruncie"
-    | [Text "z dziedziny"] -> "z dziedziny"
-    | [Text "na tle"] -> "na tle"
-    | [Text "na niwie"] -> "na niwie"
-    | [Text "w ramach"] -> "w ramach"
-    | [Text "na korzyść"] -> "na korzyść"
-    | [Text "w intencji"] -> "w intencji"
-    | [Text "na kanwie"] -> "na kanwie"
-    | [Text "na niekorzyść"] -> "na niekorzyść"
-    | [Text "z ramienia"] -> "z ramienia"
-    | [Text "w wyniku"] -> "w wyniku"
-    | [Text "za sprawą"] -> "za sprawą"
-    | [Text "w imię"] -> "w imię"
-    | [Text "w celu"] -> "w celu"
-    | [Text "z pomocą"] -> "z pomocą"
-    | [Text "per"] -> "per"
-    | [Text "co"] -> "co"
-    | [Text s] -> s
-    | l -> failwith ("parse_prep: " ^ ENIAMwalStringOf.token_list l)
-
-let rec parse_comp = function
-      [Text "int"] -> Int,[]
-    | [Text "rel"] -> Rel,[]
-    | [Text "int";SqBra l] -> Int,List.flatten (Xlist.map (split_symbol Semic [] l) (fun c -> snd (parse_comp c)))
-    | [Text "rel";SqBra l] -> Rel,List.flatten (Xlist.map (split_symbol Semic [] l) (fun c -> snd (parse_comp c)))
-    | [Text "co"] -> CompTypeUndef,[Comp "co"] (* subst qub prep comp *)
-    | [Text "kto"] -> CompTypeUndef,[Comp "kto"] (* subst *)
-    | [Text "ile"] -> CompTypeUndef,[Comp "ile"] (* num adv *)
-    | [Text "jaki"] -> CompTypeUndef,[Comp "jaki"] (* adj *)
-    | [Text "który"] -> CompTypeUndef,[Comp "który"] (* adj *)
-    | [Text "czyj"] -> CompTypeUndef,[Comp "czyj"] (* adj *)
-    | [Text "jak"] -> CompTypeUndef,[Comp "jak"] (* prep conj adv *)
-    | [Text "kiedy"] -> CompTypeUndef,[Comp "kiedy"] (* comp adv *)
-    | [Text "gdzie"] -> CompTypeUndef,[Comp "gdzie"] (* qub adv *)
-    | [Text "odkąd"] -> CompTypeUndef,[Comp "odkąd"] (* adv *)
-    | [Text "skąd"] -> CompTypeUndef,[Comp "skąd"] (* adv *)
-    | [Text "dokąd"] -> CompTypeUndef,[Comp "dokąd"] (* adv *)
-    | [Text "którędy"] -> CompTypeUndef,[Comp "którędy"] (* adv *)
-    | [Text "dlaczego"] -> CompTypeUndef,[Comp "dlaczego"] (* adv *)
-    | [Text "czemu"] -> CompTypeUndef,[Comp "czemu"] (* adv *)
-    | [Text "czy"] -> CompTypeUndef,[Comp "czy"] (* qub conj *)
-    | [Text "jakby"] -> CompTypeUndef,[Comp "jakby"] (* qub comp *)
-    | [Text "jakoby"] -> CompTypeUndef,[Comp "jakoby"] (* qub comp *)
-    | [Text "gdy"] -> CompTypeUndef,[Gdy] (* adv; gdyby: qub comp *)
-    | [Text "dopóki"] -> CompTypeUndef,[Comp "dopóki"] (* comp *)
-    | [Text "zanim"] -> CompTypeUndef,[Comp "zanim"] (* comp *)
-    | [Text "jeśli"] -> CompTypeUndef,[Comp "jeśli"] (* comp *)
-    | [Text "żeby2"] -> CompTypeUndef,[Zeby]
-    | [Text "żeby"] -> CompTypeUndef,[Comp "żeby"] (* qub comp *)
-    | [Text "że"] -> CompTypeUndef,[Comp "że"] (* qub comp *)
-    | [Text "aż"] -> CompTypeUndef,[Comp "aż"] (* qub comp *)
-    | [Text "bo"] -> CompTypeUndef,[Comp "bo"] (* qub comp *)
-    | l -> failwith ("parse_comp: " ^ ENIAMwalStringOf.token_list l)
+    | [Text "_"] -> CaseUndef
+    | l -> failwith ("parse_case: " ^ string_of_token_list l)
  
 let parse_number = function (* Maps a one-element token list to a number value: sg and pl give Number, agr gives NumberAgr, _ gives NumberUndef; any other list raises Failure with the rendered tokens in the message. *)
       [Text "sg"] -> Number "sg"
     | [Text "pl"] -> Number "pl"
     | [Text "agr"] -> NumberAgr
     | [Text "_"] -> NumberUndef
-    | l -> failwith ("parse_number: " ^ ENIAMwalStringOf.token_list l)
+    | l -> failwith ("parse_number: " ^ string_of_token_list l)
  
 let parse_gender = function
       [Text "m1"] -> Gender "m1"
@@ -291,247 +127,273 @@ let parse_gender = function
     | [Text "n"] -> Genders["n1";"n2"]
     | [Text "f"] -> Gender "f"
     | [Text "m1.n"] -> Genders["m1";"n1";"n2"]
+    | [Text "m1.n1.n2"] -> Genders["m1";"n1";"n2"]
+    | [Text "n1.n2"] -> Genders["n1";"n2"]
     | [Text "_"] -> GenderUndef
     | [Text "agr"] -> GenderAgr
-    | l -> failwith ("parse_gender: " ^ ENIAMwalStringOf.token_list l)
+    | l -> failwith ("parse_gender: " ^ string_of_token_list l)
  
 let parse_grad = function (* Maps a one-element token list to a degree value: pos, com and sup give Grad with the same string, _ gives GradUndef; any other list raises Failure with the rendered tokens in the message. *)
       [Text "pos"] -> Grad "pos"
     | [Text "com"] -> Grad "com"
     | [Text "sup"] -> Grad "sup"
     | [Text "_"] -> GradUndef
-    | l -> failwith ("parse_grad: " ^ ENIAMwalStringOf.token_list l)
+    | l -> failwith ("parse_grad: " ^ string_of_token_list l)
+
+let parse_aspect = function (* Maps a one-element token list to an aspect
+     value: perf and imperf give Aspect with the same string, _ gives
+     AspectUndef and the empty text gives AspectNA.  Any other list raises
+     Failure with the rendered tokens in the message. *)
+      [Text "perf"] -> Aspect "perf"
+    | [Text "imperf"] -> Aspect "imperf"
+    | [Text "_"] -> AspectUndef
+    | [Text ""] -> AspectNA
+    | l -> failwith ("parse_aspect: " ^ string_of_token_list l)
+
+let parse_negation = function (* Maps a one-element token list to a negation
+     value: _ gives NegationUndef, neg gives Negation, aff gives Aff and
+     the empty text gives NegationNA.  Any other list raises Failure with
+     the rendered tokens in the message. *)
+    [Text "_"] -> NegationUndef
+  | [Text "neg"] -> Negation
+  | [Text "aff"] -> Aff
+  | [Text ""] -> NegationNA
+  | l -> failwith ("parse_negation: " ^ string_of_token_list l)
  
 let parse_refl = function
-      [] -> ReflEmpty
+      (* [] -> ReflEmpty
     | [Text "się"] -> ReflSie
     | [Text ""] -> ReflEmpty
     | [Text "false"] -> ReflEmpty
-    | [Text "true"] -> ReflSie
-    | l -> failwith ("parse_refl: " ^ ENIAMwalStringOf.token_list l)
-
-let rec parse_lex = function
-      [Quot; Text "E"; Paren[Text gender]; Quot] -> Elexeme(parse_gender [Text gender])
-    | [Quot; Text x; Quot] -> Lexeme x
-    | [Quot; Text x; Comma; Text y; Quot] -> Lexeme (x ^ "," ^ y)
-    | [Text "OR"; Paren l] ->
-         (match split_symbol Semic [] l with
-           [l] -> (match split_symbol Comma [] l with
-               [_] -> failwith "parse_lex OR"
-             | ll -> ORconcat(Xlist.map ll parse_lex))
-         | ll -> ORcoord(Xlist.map ll parse_lex))
-    | [Text "XOR"; Paren l] -> XOR(Xlist.map (List.flatten (Xlist.map (split_symbol Semic [] l) (split_symbol Comma []))) parse_lex)
-    | l -> failwith ("parse_lex: " ^ ENIAMwalStringOf.token_list l)
-
-let get_lexeme = function
-    Lexeme s -> s
-  | _ -> failwith "get_lexeme"
-
-let new_schema r cr ce morfs =
-   {gf=r; role=""; role_attr="";sel_prefs=[]; cr=cr; ce=ce; dir=Both; morfs=morfs}
-
-let rec parse_restr = function
-      [Text "natr"] -> Natr,[]
-    | [Text "atr"] -> Atr,[]
-    | [Text "ratr"] -> Ratr,[]
-    | [Text "atr1"] -> Atr1,[]
-    | [Text "ratr1"] -> Ratr1,[]
-    | [Text "ratr1"; Paren schema] -> Ratr1, parse_schema_simple schema
-    | [Text "ratr"; Paren schema] -> Ratr, parse_schema_simple schema
-    | [Text "atr1"; Paren schema] -> Atr1, parse_schema_simple schema
-    | [Text "atr"; Paren schema] -> Atr, parse_schema_simple schema
-    | l -> failwith ("parse_restr: " ^ ENIAMwalStringOf.token_list l)
-
-and parse_schema_simple schema =
-  Xlist.map (split_symbol Plus [] schema) (function
-      [Bracet b] -> let r,cr,ce = parse_roles [] in new_schema r cr ce (parse_morfs b)
-    | [Text s1;Bracet b] -> let r,cr,ce = parse_roles [s1] in new_schema r cr ce (parse_morfs b)
-    | _ -> failwith "parse_schema_simple")
-
-and parse_mode = function
-      [Text "abl"] -> "abl",[]
-    | [Text "adl"] -> "adl",[]
-    | [Text "caus"] -> "caus",[]
-    | [Text "dest"] -> "dest",[]
-    | [Text "dur"] -> "dur",[]
-    | [Text "instr"] -> "instr",[]
-    | [Text "locat"] -> "locat",[]
-    | [Text "perl"] -> "perl",[]
-    | [Text "temp"] -> "temp",[]
-    | [Text "abl";SqBra l] -> "abl",parse_morfs l
-    | [Text "adl";SqBra l] -> "adl",parse_morfs l
-    | [Text "caus";SqBra l] -> "caus",parse_morfs l
-    | [Text "dest";SqBra l] -> "dest",parse_morfs l
-    | [Text "dur";SqBra l] -> "dur",parse_morfs l
-    | [Text "instr";SqBra l] -> "instr",parse_morfs l
-    | [Text "locat";SqBra l] -> "locat",parse_morfs l
-    | [Text "perl";SqBra l] -> "perl",parse_morfs l
-    | [Text "temp";SqBra l] -> "temp",parse_morfs l
-    | [Text "mod"] -> "mod",[]
-    | [Text "mod";SqBra l] -> "mod",parse_morfs l
-    | [Text "pron"] -> "pron",[]
-    | [Text "misc"] -> "misc",[]
-    | l -> failwith ("parse_mode: " ^ ENIAMwalStringOf.token_list l)
+    | [Text "true"] -> ReflSie *)
+  | [Text "nosię"] -> ReflFalse
+  | [Text "się"] -> ReflTrue
+  | l -> failwith ("parse_refl: " ^ string_of_token_list l)
+
+let parse_ctype = function (* Maps a one-element token list to a clause type:
+     int gives Int, rel gives Rel, _ gives CompTypeUndef.  Any other list
+     raises Failure with the rendered tokens in the message. *)
+    [Text "int"] -> Int
+  | [Text "rel"] -> Rel
+  | [Text "_"] -> CompTypeUndef
+  | l -> failwith ("parse_ctype: " ^ string_of_token_list l)
+
+let parse_acm = function (* Accepts only the single token _ and maps it to AcmUndef; every other token list raises Failure with the rendered tokens in the message.  The commented-out arms below are leftovers and are not active. *)
+    (* [Text "int"] -> Int
+  | [Text "rel"] -> Rel *)
+  | [Text "_"] -> AcmUndef
+  | l -> failwith ("parse_acm: " ^ string_of_token_list l)
+
+let parse_comp = function (* Maps a one-element token list naming a
+     complementizer to a comp value.  Every listed word gives Comp with the
+     same string, with three exceptions: gdy gives Gdy, żeby2 gives Zeby
+     and _ gives CompUndef.  Any other list raises Failure with the
+     rendered tokens in the message.  The trailing comments on the arms
+     list part-of-speech tags associated with each word. *)
+    | [Text "co"] -> Comp "co" (* subst qub prep comp *)
+    | [Text "kto"] -> Comp "kto" (* subst *)
+    | [Text "ile"] -> Comp "ile" (* num adv *)
+    | [Text "jaki"] -> Comp "jaki" (* adj *)
+    | [Text "który"] -> Comp "który" (* adj *)
+    | [Text "czyj"] -> Comp "czyj" (* adj *)
+    | [Text "jak"] -> Comp "jak" (* prep conj adv *)
+    | [Text "kiedy"] -> Comp "kiedy" (* comp adv *)
+    | [Text "gdzie"] -> Comp "gdzie" (* qub adv *)
+    | [Text "odkąd"] -> Comp "odkąd" (* adv *)
+    | [Text "skąd"] -> Comp "skąd" (* adv *)
+    | [Text "dokąd"] -> Comp "dokąd" (* adv *)
+    | [Text "którędy"] -> Comp "którędy" (* adv *)
+    | [Text "dlaczego"] -> Comp "dlaczego" (* adv *)
+    | [Text "czemu"] -> Comp "czemu" (* adv *)
+    | [Text "czy"] -> Comp "czy" (* qub conj *)
+    | [Text "jakby"] -> Comp "jakby" (* qub comp *)
+    | [Text "jakoby"] -> Comp "jakoby" (* qub comp *)
+    | [Text "gdy"] -> Gdy (* adv; gdyby: qub comp *)
+    | [Text "dopóki"] -> Comp "dopóki" (* comp *)
+    | [Text "zanim"] -> Comp "zanim" (* comp *)
+    | [Text "jeśli"] -> Comp "jeśli" (* comp *)
+    | [Text "żeby2"] -> Zeby
+    | [Text "żeby"] -> Comp "żeby" (* qub comp *)
+    | [Text "że"] -> Comp "że" (* qub comp *)
+    | [Text "aż"] -> Comp "aż" (* qub comp *)
+    | [Text "bo"] -> Comp "bo" (* qub comp *)
+    | [Text "niczym"] -> Comp "niczym"
+    | [Text "_"] -> CompUndef
+    | l -> failwith ("parse_comp: " ^ string_of_token_list l)
+
+let parse_opinion = function (* Maps a plain string (not a token list) to an
+     opinion value.  Only the full Polish names are accepted; the
+     three-letter abbreviations are commented out and therefore fall
+     through to the last arm, which raises Failure with the offending
+     string in the message. *)
+    "pewny" -> Pewny
+  (* | "cer" -> Pewny *)
+  | "potoczny" -> Potoczny
+  (* | "col" -> Potoczny *)
+  | "wątpliwy" -> Watpliwy
+  (* | "unc" -> Watpliwy *)
+  | "archaiczny" -> Archaiczny
+  (* | "dat" -> Archaiczny *)
+  | "zły" -> Zly
+  (* | "bad" -> Zly *)
+  | "wulgarny" -> Wulgarny
+  (* | "vul" -> Wulgarny *)
+  | x -> failwith ("parse_opinion: " ^ x)
+
+let parse_pred = function (* Maps a plain string (not a token list) to a predicativity value: pred gives PredTrue, nopred gives PredFalse; any other string raises Failure with that string in the message. *)
+    "pred" -> PredTrue
+  | "nopred" -> PredFalse
+  | s -> failwith ("parse_pred: " ^ s)
+
+let parse_pos = function (* Builds a part-of-speech value from a pair made of
+     a tag name and the list of its arguments, each argument being a token
+     list.  An arm matches only when both the tag and the number of
+     arguments agree; the arguments are then converted by the parse_*
+     helpers, which raise Failure on values they do not know.
+     A pair matched by no arm is not fatal: one diagnostic line is printed
+     on standard output and FIXED is returned.
+     NOTE(review): no arm handles a FIXED tag explicitly, so such input
+     also goes through the printing fallback -- confirm this is intended. *)
+    "SUBST",[number;case] -> SUBST(parse_number number,parse_case case)
+  | "PPRON12",[number;case] -> PPRON12(parse_number number,parse_case case)
+  | "PPRON3",[number;case] -> PPRON3(parse_number number,parse_case case)
+  | "SIEBIE",[case] -> SIEBIE(parse_case case)
+  | "PREP",[case] -> PREP(parse_case case)
+  | "NUM",[case;gender;acm] -> NUM(parse_case case,parse_gender gender,parse_acm acm)
+  | "ADJ",[number;case;gender;grad] -> ADJ(parse_number number,parse_case case,parse_gender gender,parse_grad grad)
+  | "ADV",[grad] -> ADV(parse_grad grad)
+  | "GER",[number;case;gender;aspect;negation;refl] -> GER(parse_number number,parse_case case,parse_gender gender,parse_aspect aspect,parse_negation negation,parse_refl refl)
+  | "PPAS",[number;case;gender;aspect;negation] -> PPAS(parse_number number,parse_case case,parse_gender gender,parse_aspect aspect,parse_negation negation)
+  | "PACT",[number;case;gender;aspect;negation;refl] -> PACT(parse_number number,parse_case case,parse_gender gender,parse_aspect aspect,parse_negation negation,parse_refl refl)
+  | "INF",[aspect;negation;refl] -> INF(parse_aspect aspect,parse_negation negation,parse_refl refl)
+  | "QUB",[] -> QUB
+  | "COMPAR",[] -> COMPAR
+  | "COMP",[ctype] -> COMP(parse_ctype ctype)
+  | "PERS",[negation;refl] -> PERS(parse_negation negation,parse_refl refl)
+  | s,ll -> print_endline ("parse_pos: " ^ s ^ "(" ^ String.concat "," (Xlist.map ll string_of_token_list) ^ ")"); FIXED
+
+let rec parse_phrase = function (* Builds a phrase value from a pair made of
+     a phrase name and the list of its arguments, each argument being a
+     token list.  An arm matches only when the name, the number of
+     arguments and, where a single Text token is required, the shape of
+     the argument all agree.
+     The E arm delegates its argument to parse_morf, the other member of
+     this recursive group.  A fixed phrase with two text arguments is
+     rebuilt as one lemma with a comma between the parts.  The lex arms
+     come in two forms, without and with a leading numeric id; the id is
+     converted by int_of_string, which raises Failure when the text is
+     not an integer.
+     A pair matched by no arm is not fatal: one diagnostic line is printed
+     on standard output and Null is returned. *)
+    "np",[case] -> NP(parse_case case)
+  | "prepnp",[[Text prep]; case] -> PrepNP(prep,parse_case case)
+  | "adjp",[case] -> AdjP(parse_case case)
+  | "prepadjp",[[Text prep]; case] -> PrepAdjP(prep,parse_case case)
+  | "comprepnp",[[Text prep]] -> ComprepNP prep
+  | "comparp",[[Text prep]] -> ComparP prep
+  | "cp",[ctype;comp] -> CP(parse_ctype ctype,parse_comp comp)
+  | "ncp",[case;ctype;comp] -> NCP(parse_case case,parse_ctype ctype,parse_comp comp)
+  | "prepncp",[[Text prep];case;ctype;comp] -> PrepNCP(prep,parse_case case,parse_ctype ctype,parse_comp comp)
+  | "infp",[aspect] -> InfP(parse_aspect aspect)
+  | "fixed",[[Text lemma]] -> FixedP lemma
+  | "fixed",[[Text lemma1];[Text lemma2]] -> FixedP (lemma1 ^ "," ^ lemma2)
+  | "or",[] -> Or
+  | "refl",[] -> Refl
+  | "recip",[] -> Recip
+  | "E",[morf] -> E(parse_morf morf)
+  | "advp",[] -> AdvP
+  | "null",[] -> Null
+  | "lex",[[Text lemma];[Text pos; Paren p]] -> SimpleLexArg(lemma,parse_pos (pos, split_symbol Comma [] p))
+  | "lex",[[Text lemma];[Text pos]] -> SimpleLexArg(lemma,parse_pos (pos, []))
+  | "lex",[[Text id];[Text lemma];[Text pos; Paren p]] -> LexArg(int_of_string id,lemma,parse_pos (pos, split_symbol Comma [] p))
+  | "lex",[[Text id];[Text lemma];[Text pos]] -> LexArg(int_of_string id,lemma,parse_pos (pos, []))
+  | s,ll -> print_endline ("parse_phrase: " ^ s ^ "(" ^ String.concat "," (Xlist.map ll string_of_token_list) ^ ")"); Null
  
 and parse_morf = function
-    "np",[case] -> Phrase(NP(parse_case case))
-  | "prepnp",[prep; case] -> Phrase(PrepNP(Sem,parse_prep prep,parse_case case))
-  | "adjp",[case] -> Phrase(AdjP(parse_case case))
-  | "prepadjp",[prep; case] -> Phrase(PrepAdjP(Sem,parse_prep prep,parse_case case))
-  | "nump",[case] -> Phrase(NumP(parse_case case))
-  | "prepnump",[prep; case] -> Phrase(PrepNumP(Sem,parse_prep prep,parse_case case))
-  | "comprepnp",[prep] -> Phrase(ComprepNP(Sem,parse_prep prep))
-  | "compar",[prep] -> PhraseAbbr(ComparP(parse_prep prep),[])
-  | "cp",[comp] -> PhraseComp(Cp,parse_comp comp)
-  | "ncp",[case; comp] -> PhraseComp(Ncp(parse_case case),parse_comp comp)
-  | "prepncp",[prep; case; comp] -> PhraseComp(Prepncp(parse_prep prep,parse_case case),parse_comp comp)
-  | "infp",[aspect] -> Phrase(InfP(parse_aspect aspect(*,ReqUndef*)))
-  | "fixed",[morf;lex] -> Phrase(FixedP((*parse_morf_single morf,*) get_lexeme (parse_lex lex)))
-  | "fixed",[morf;lex;lex2] -> Phrase(FixedP((*parse_morf_single morf,*) get_lexeme (parse_lex (lex @ [Comma] @ lex2))))
-  | "or",[] -> Phrase Or
-  | "refl",[] -> Phrase (*Refl*)(Lex "się")
-  | "recip",[] -> Phrase (*Recip*)(Lex "się") (* FIXME *)
-  | "E",[] -> E Null
-  | "advp",[mode] -> let mode,morfs = parse_mode mode in PhraseAbbr(Advp mode,morfs)
-  | "xp",[mode] -> let mode,morfs = parse_mode mode in PhraseAbbr(Xp mode,morfs)
-  | "nonch",[] -> PhraseAbbr(Nonch,[])
-  | "distrp",[] -> PhraseAbbr(Distrp,[])
-  | "possp",[] -> PhraseAbbr(Possp,[])
-  | "null",[] -> Phrase Null
-  | "lex",[Text a; Paren p] :: ll -> parse_lex_morf (a, split_symbol Comma [] p, ll)
-  | "lex",[Text a] :: ll -> parse_lex_morf (a, [], ll)
-  | s,ll -> failwith ("parse_morf: " ^ s ^ "(" ^ String.concat "," (Xlist.map ll ENIAMwalStringOf.token_list) ^ ")")
-
-and parse_lex_morf = function
-  | "np",[case],[num;lex;restr] -> LexPhrase([SUBST(parse_number num,parse_case case),parse_lex lex], parse_restr restr)
-  | "prepnp",[prep; case],[num;lex;restr] -> LexPhrase([PREP(parse_case case),Lexeme(parse_prep prep);SUBST(parse_number num,parse_case case),parse_lex lex], parse_restr restr)
-  | "adjp",[case],[num;gender;grad;lex;restr] -> LexPhrase([ADJ(parse_number num,parse_case case,parse_gender gender,parse_grad grad),parse_lex lex], parse_restr restr)
-  | "prepadjp",[prep; case],[num;gender;grad;lex;restr] -> LexPhrase([PREP(parse_case case),Lexeme(parse_prep prep);ADJ(parse_number num,parse_case case,parse_gender gender,parse_grad grad),parse_lex lex], parse_restr restr)
-  | "ppasp",[case],[num;gender;negation;lex;restr] -> LexPhrase([PPAS(parse_number num,parse_case case,parse_gender gender,AspectUndef,parse_negation negation),parse_lex lex], parse_restr restr)
-  | "prepppasp",[prep;case],[num;gender;negation;lex;restr] -> LexPhrase([PREP(parse_case case),Lexeme(parse_prep prep);PPAS(parse_number num,parse_case case,parse_gender gender,AspectUndef,parse_negation negation),parse_lex lex], parse_restr restr)
-  | "pactp",[case],[num;gender;negation;lex;refl;restr] -> LexPhrase([PACT(parse_number num,parse_case case,parse_gender gender,AspectUndef,parse_negation negation,parse_refl refl),parse_lex lex], parse_restr restr)
-  | "preppactp",[prep;case],[num;gender;negation;lex;refl;restr] -> LexPhrase([PREP(parse_case case),Lexeme(parse_prep prep);PACT(parse_number num,parse_case case,parse_gender gender,AspectUndef,parse_negation negation,parse_refl refl),parse_lex lex], parse_restr restr)
-  | "gerp",[case],[num;negation;lex;refl;restr] -> LexPhrase([GER(parse_number num,parse_case case,GenderUndef,AspectUndef,parse_negation negation,parse_refl refl),parse_lex lex], parse_restr restr)
-  | "prepgerp",[prep;case],[num;negation;lex;refl;restr] -> LexPhrase([PREP(parse_case case),Lexeme(parse_prep prep);GER(parse_number num,parse_case case,GenderUndef,AspectUndef,parse_negation negation,parse_refl refl),parse_lex lex], parse_restr restr)
-  | "nump",[case],[lex1;lex2;restr] -> LexPhrase([NUM(parse_case case,GenderUndef,AcmUndef),parse_lex lex1;SUBST(NumberUndef,CaseUndef),parse_lex lex2], parse_restr restr)
-  | "prepnump",[prep;case],[lex1;lex2;restr] -> LexPhrase([PREP(parse_case case),Lexeme(parse_prep prep);NUM(parse_case case,GenderUndef,AcmUndef),parse_lex lex1;SUBST(NumberUndef,CaseUndef),parse_lex lex2], parse_restr restr)
-  | "compar",[prep],[morfs] -> LexPhrase([COMPAR,Lexeme(parse_prep prep)],(Ratrs,Xlist.map (split_symbol Plus [] morfs) (fun morf -> new_schema ARG [] [] [parse_morf_single morf])))
-  | "infp",[aspect],[negation;lex;refl;restr] -> LexPhrase([INF(parse_aspect aspect,parse_negation negation,parse_refl refl),parse_lex lex], parse_restr restr)
-  | "qub",[],[lex;restr] -> LexPhrase([QUB,parse_lex lex], parse_restr restr)
-  | "advp",[mode],[grad;lex;restr] ->
-       (match parse_mode mode with
-          mode, [] -> LexPhraseMode(mode,[ADV(parse_grad grad),parse_lex lex], parse_restr restr)
-        | _ -> failwith "parse_lex_morf")
-  | "xp",[[Text mode;SqBra [Text "prepgerp"; Paren [prep;Comma;case]]]],[num;negation;lex;refl;restr] ->
-       LexPhraseMode(mode,[PREP(parse_case [case]),Lexeme(parse_prep [prep]);GER(parse_number num,parse_case [case],GenderUndef,AspectUndef,parse_negation negation,parse_refl refl),parse_lex lex], parse_restr restr)
-  | "xp",[mode],ll ->
-       (match parse_mode mode,ll with
-          (mode,[Phrase(NP case)]),[num;lex;restr] -> LexPhraseMode(mode,[SUBST(parse_number num,case),parse_lex lex], parse_restr restr)
-        | (mode,[Phrase(PrepNP(_,prep,case))]),[num;lex;restr] -> LexPhraseMode(mode,[PREP case,Lexeme prep;SUBST(parse_number num,case),parse_lex lex], parse_restr restr)
-        | (mode,[Phrase(PrepAdjP(_,prep,case))]),[num;gender;grad;lex;restr] -> LexPhraseMode(mode,[PREP case,Lexeme prep;ADJ(parse_number num,case,parse_gender gender,parse_grad grad),parse_lex lex], parse_restr restr)
-        | (mode,[Phrase(NumP case)]),[lex1;lex2;restr] -> LexPhraseMode(mode,[NUM(case,GenderUndef,AcmUndef),parse_lex lex1;SUBST(NumberUndef,CaseUndef),parse_lex lex2], parse_restr restr)
-        | (mode,[Phrase(PrepNumP(_,prep,case))]),[lex1;lex2;restr] -> LexPhraseMode(mode,[PREP case,Lexeme prep;NUM(case,GenderUndef,AcmUndef),parse_lex lex1;SUBST(NumberUndef,CaseUndef),parse_lex lex2], parse_restr restr)
-        | (mode,[PhraseAbbr(Advp _,[])]),[grad;lex;restr] -> LexPhraseMode(mode,[ADV(parse_grad grad),parse_lex lex], parse_restr restr)
-        | (mode,[PhraseAbbr(ComparP prep,[])]),[morfs] -> LexPhraseMode(mode,[COMPAR,Lexeme prep],(Ratrs,Xlist.map (split_symbol Plus [] morfs) (fun morf -> new_schema ARG [] [] [parse_morf_single morf])))
-        | (mode,[PhraseComp(Cp,(ctype,[Comp comp]))]),[negation;lex;refl;restr] -> LexPhrase([COMP ctype,Lexeme comp;PERS(parse_negation negation,parse_refl refl),parse_lex lex], parse_restr restr)
-        | _ -> failwith ("parse_lex_morf: xp(" ^ ENIAMwalStringOf.token_list mode ^ ")," ^ String.concat "," (Xlist.map ll ENIAMwalStringOf.token_list) ^ ")"))
-  | "cp",[comp],[negation;lex;refl;restr] ->
-       (match parse_comp comp with
-          ctype,[Comp comp] -> LexPhrase([COMP ctype,Lexeme comp;PERS(parse_negation negation,parse_refl refl),parse_lex lex], parse_restr restr)
-        | ctype,[Comp comp1;Comp comp2] -> LexPhrase([COMP ctype,XOR[Lexeme comp1;Lexeme comp2];PERS(parse_negation negation,parse_refl refl),parse_lex lex], parse_restr restr)
-        | _,comp -> failwith ("parse_lex_morf comp: " (*^ ENIAMwalStringOf.comp comp*)))
-  | "ncp",[case;comp],[negation;lex;refl;restr] ->
-       (match parse_comp comp with
-          ctype,[Comp comp] -> LexPhrase([SUBST(Number "sg",parse_case case),Lexeme "to";COMP ctype,Lexeme comp;PERS(parse_negation negation,parse_refl refl),parse_lex lex], parse_restr restr)
-        | _,comp -> failwith ("parse_lex_morf comp: " (*^ ENIAMwalStringOf.comp comp*)))
-  | s,ll,ll2 -> failwith ("parse_lex_morf: " ^ s ^ "(" ^ String.concat "," (Xlist.map ll ENIAMwalStringOf.token_list) ^ ")," ^ String.concat "," (Xlist.map ll2 ENIAMwalStringOf.token_list) ^ ")")
-
-and parse_morfs l =
-  let morfs = Xlist.map (split_symbol Semic [] l) (function
-    [Text a; Paren p] -> parse_morf (a, split_symbol Comma [] p)
-  | [Text a] -> parse_morf (a, [])
-  | l -> failwith ("parse_morfs: " ^ ENIAMwalStringOf.token_list l)) in
-(*   expand_prep_morfs equivs (expand_comp_morfs equivs morfs) *)morfs
-
-and parse_morf_single l = (* FIXME: problem z equivs *)
-  match parse_morfs l with
-    [x] -> x
-  | l -> failwith ("parse_morf_single: " ^ String.concat ";" (Xlist.map l ENIAMwalStringOf.morf))
-
-let split_schema schema =
-  find_brackets (Xlist.map (Str.full_split (Str.regexp "\\]\\|\\+\\|{\\|}\\|(\\|)\\|,\\|;\\|'\\|\\[") schema) (function
-      Str.Text s -> Text s
-    | Str.Delim "(" -> LParen
-    | Str.Delim ")" -> RParen
-    | Str.Delim "{" -> LBracet
-    | Str.Delim "}" -> RBracet
-    | Str.Delim "[" -> LSqBra
-    | Str.Delim "]" -> RSqBra
-    | Str.Delim ";" -> Semic
-    | Str.Delim "+" -> Plus
-    | Str.Delim "," -> Comma
-    | Str.Delim "'" -> Quot
-    | _ -> failwith "parse_schema"))
+    [Text a; Paren p] -> parse_phrase (a, split_symbol Comma [] p)
+  | [Text a] -> parse_phrase (a, [])
+  | l -> failwith ("parse_morf: " ^ string_of_token_list l)
  
-let parse_schema schema =
-  if schema = "" then [] else (
-  let l = split_schema schema in
-(*   print_endline schema; *)
+(* Classifies a list of role labels.
+   Returns a 4-tuple (gf, controllers, controllees, modes):
+   - gf is SUBJ or OBJ when exactly one of "subj"/"obj" occurs, ARG when
+     neither occurs; more than one such label raises Failure "parse_roles";
+   - "controller"/"controller2" contribute "1"/"2" to the controller list,
+     "controllee"/"controllee2" contribute "1"/"2" to the controllee list;
+   - the remaining known labels are collected verbatim as modes;
+   - the empty label is ignored; any other label raises
+     Failure ("parse_roles: " ^ label).
+   The three lists are built by consing, so they come out in reverse order
+   of appearance in the input. *)
+let parse_roles l =
+  let step (gfs,ctrl,ctrle,modes) label =
+    match label with
+      "subj" -> SUBJ :: gfs, ctrl, ctrle, modes
+    | "obj" -> OBJ :: gfs, ctrl, ctrle, modes
+    | "controller" -> gfs, "1" :: ctrl, ctrle, modes
+    | "controllee" -> gfs, ctrl, "1" :: ctrle, modes
+    | "controller2" -> gfs, "2" :: ctrl, ctrle, modes
+    | "controllee2" -> gfs, ctrl, "2" :: ctrle, modes
+    | "misc" | "locat" | "abl" | "adl" | "caus" | "mod" | "temp" | "dur"
+    | "possp" | "perl" | "instr" | "dest" | "distrp" | "lemma" | "refl"
+    | "recip" | "nonch" | "pron" -> gfs, ctrl, ctrle, label :: modes
+    | "" -> gfs, ctrl, ctrle, modes
+    | _ -> failwith ("parse_roles: " ^ label) in
+  let gfs,cr,ce,m = Xlist.fold l ([],[],[],[]) step in
+  let gf =
+    match gfs with
+      [] -> ARG
+    | [x] -> x
+    | _ -> failwith "parse_roles" in
+  gf,cr,ce,m
+
+(* Parses the token list of an entry's schema into (restriction, positions).
+   An empty list gives NoRestr with no positions; the single tokens
+   "atr", "ratr", "atr1", "ratr1" give the matching restriction with no
+   positions.  Anything else is split on Plus and every piece is read as a
+   position: a braced list of morfs separated by Semic, optionally preceded
+   by one role label that is handed to parse_roles.  A piece of any other
+   shape is reported on stdout and replaced by empty_position. *)
+let parse_schema tokens =
+  let morfs_of l = Xlist.map (split_symbol Semic [] l) parse_morf in
+  let parse_position = function
+      [Bracet l] -> {empty_position with morfs=morfs_of l}
+    | [Text s; Bracet l] ->
+      let gf,cr,ce,m = parse_roles [s] in
+      let morfs = morfs_of l in
+      {empty_position with gf=gf; cr=cr; ce=ce; mode=m; morfs=morfs}
+    | l ->
+      print_endline ("parse_schema: " ^ string_of_token_list l);
+      empty_position in
+  match tokens with
+    [] -> NoRestr,[]
+  | [Text "atr"] -> Atr,[]
+  | [Text "ratr"] -> Ratr,[]
+  | [Text "atr1"] -> Atr1,[]
+  | [Text "ratr1"] -> Ratr1,[]
+  | l -> NoRestr,Xlist.map (split_symbol Plus [] l) parse_position
+
+(* Reads a morf given as a single numeric identifier token and wraps it in
+   MorfId.  Any other token list is reported on stdout and yields Null.
+   int_of_string raises Failure when the token is not an integer. *)
+let parse_simple_morf tokens =
+  match tokens with
+    [Text id] -> MorfId (int_of_string id)
+  | _ ->
+    print_endline ("parse_simple_morf: " ^ string_of_token_list tokens);
+    Null
+
+(* Parses the token list of a schema whose morfs are numeric identifiers.
+   An empty token list gives an empty schema.  Otherwise the tokens are split
+   on Plus and each piece becomes one position: zero to four comma-separated
+   role labels (interpreted by parse_roles) followed by a braced list that is
+   split on Semic and parsed item by item with parse_simple_morf.
+   A piece of any other shape is reported on stdout and replaced by
+   empty_position. *)
+let parse_simple_schema l =
+  if l = [] then [] else
   Xlist.map (split_symbol Plus [] l) (function
-      [Bracet b] -> let r,cr,ce = parse_roles [] in new_schema r cr ce (parse_morfs b)
-    | [Text s1;Bracet b] -> let r,cr,ce = parse_roles [s1] in new_schema r cr ce (parse_morfs b)
-    | [Text s1;Comma;Text s2;Bracet b] -> let r,cr,ce = parse_roles [s1;s2] in new_schema r cr ce (parse_morfs b)
-    | [Text s1;Comma;Text s2;Comma;Text s3;Bracet b] -> let r,cr,ce = parse_roles [s1;s2;s3] in new_schema r cr ce (parse_morfs b)
-    | _ -> failwith ("parse_schema: " ^ schema)))
-
-let parse_lexeme s =
-  match Str.split (Str.regexp " ") s with
-    [s] -> s,""
-  | [s;"się"] -> s,"się"
-  | _ -> failwith ("parse_lexeme: " ^ s)
-
-let load_frames filename =
-  Xlist.fold (List.tl (Str.split (Str.regexp "\n") (File.load_file filename))) StringMap.empty (fun schemas line ->
-    if String.sub line 0 1 = "%" then schemas else
-    match Str.split_delim (Str.regexp ": ") line with
-      [lexeme;opinion;negation;pred;aspect;schema] ->
-         let lexeme,refl = parse_lexeme lexeme in
-         StringMap.add_inc schemas lexeme [refl,opinion,negation,pred,aspect,schema] (fun l -> (refl,opinion,negation,pred,aspect,schema) :: l)
-    | _ -> failwith ("load_frames: " ^ line))
-
-
-
-let rec extract_fixed_schema fixed schema =
-  Xlist.fold schema fixed (fun fixed s ->
-    Xlist.fold s.morfs fixed (fun fixed -> function
-            Phrase(FixedP s) -> StringSet.add fixed s
-          | LexPhrase(_,(_,schema)) -> extract_fixed_schema fixed schema
-          | LexPhraseMode(_,_,(_,schema)) -> extract_fixed_schema fixed schema
-          | _ -> fixed))
-
-(*let extract_fixed fixed_filename = (* FIXME: nie wykrywa fixed w argumentach leksykalizacji *)
-(*   let expands,compreps,comprep_reqs,subtypes,equivs = load_realizations () in *)
-  let fixed = Xlist.fold Paths.walenty_filenames StringSet.empty (fun fixed filename ->
-(*     print_endline filename; *)
-    let frames = load_frames (Paths.walenty_path ^ filename) in
-    StringMap.fold frames fixed (fun fixed _ l ->
-      Xlist.fold l fixed (fun fixed (refl,opinion,negation,pred,aspect,schema) ->
-        extract_fixed_schema fixed (parse_schema schema)))) in
-  let entries = StringSet.fold fixed StringSet.empty (fun entries s ->
-    let tokens = List.rev (Xlist.fold (Str.full_split (Str.regexp " \\|,") s) [] (fun l -> function
-        Str.Text t -> t :: l
-      | Str.Delim " " -> l
-      | Str.Delim t -> t :: l)) in
-    let tokens_string = String.concat " " tokens in
-    Xlist.fold tokens entries (fun entries token ->
-      StringSet.add entries (Printf.sprintf "%s\t%s\t%s:fixed\tfixed" token s tokens_string))) in
-  File.file_out fixed_filename (fun file ->
-    StringSet.iter entries (fun entry ->
-      Printf.fprintf file "%s\n" entry))
-
-(* generowanie fixed.tab *)
-(* let _ = extract_fixed "data/fixed.tab" *)
+        [Bracet l] ->
+        let morfs = Xlist.map (split_symbol Semic [] l) parse_simple_morf in
+        {empty_position with morfs=morfs}
+      | [Text s; Bracet l] ->
+        let gf,cr,ce,m = parse_roles [s] in
+        let morfs = Xlist.map (split_symbol Semic [] l) parse_simple_morf in
+        {empty_position with gf=gf; cr=cr; ce=ce; mode=m; morfs=morfs}
+      | [Text s1; Comma; Text s2; Bracet l] ->
+        let gf,cr,ce,m = parse_roles [s1;s2] in
+        let morfs = Xlist.map (split_symbol Semic [] l) parse_simple_morf in
+        {empty_position with gf=gf; cr=cr; ce=ce; mode=m; morfs=morfs}
+      | [Text s1; Comma; Text s2; Comma; Text s3; Bracet l] ->
+        let gf,cr,ce,m = parse_roles [s1;s2;s3] in
+        let morfs = Xlist.map (split_symbol Semic [] l) parse_simple_morf in
+        {empty_position with gf=gf; cr=cr; ce=ce; mode=m; morfs=morfs}
+      | [Text s1; Comma; Text s2; Comma; Text s3; Comma; Text s4; Bracet l] ->
+        let gf,cr,ce,m = parse_roles [s1;s2;s3;s4] in
+        let morfs = Xlist.map (split_symbol Semic [] l) parse_simple_morf in
+        {empty_position with gf=gf; cr=cr; ce=ce; mode=m; morfs=morfs}
+      | l -> print_endline ("parse_simple_schema: " ^ string_of_token_list l); empty_position)
+
+(* Builds a lexicon entry from its tokenised header and an already parsed
+   (restriction, schema) pair:
+   - lex(lemma,pos)     -> SimpleLexEntry, the pair is not used;
+   - lex(id,lemma,pos)  -> LexEntry carrying the pair;
+   - comprepnp(lemma)   -> ComprepNPEntry carrying the pair.
+   Any other header is reported on stdout and replaced by
+   SimpleLexEntry("","").  int_of_string raises Failure on a non-numeric id. *)
+let parse_entry (restr,schema) tokens =
+  match tokens with
+    [Text "lex"; Paren [Text lemma; Comma; Text pos]] ->
+    SimpleLexEntry(lemma,pos)
+  | [Text "lex"; Paren [Text id; Comma; Text lemma; Comma; Text pos]] ->
+    LexEntry(int_of_string id,lemma,pos,restr,schema)
+  | [Text "comprepnp"; Paren [Text lemma]] ->
+    ComprepNPEntry(lemma,restr,schema)
+  | _ ->
+    print_endline ("parse_entry: " ^ string_of_token_list tokens);
+    SimpleLexEntry("","")
+
+(* Loads lexical entries from a tab-separated file.
+   Each row has the fields pos, lemma, entry and an optional schema (a
+   missing schema is treated as the empty string); any other arity raises
+   Failure "load_entries".  The schema is parsed first with parse_schema,
+   then the entry header with parse_entry, and the result is accumulated
+   under (pos, lemma) with Entries.add_inc. *)
+let load_entries filename =
+  let parse_row = function
+      [pos; lemma; entry; schema] -> pos, lemma, entry, schema
+    | [pos; lemma; entry] -> pos, lemma, entry, ""
+    | _ -> failwith "load_entries" in
+  let add_row entries (pos,lemma,entry,schema) =
+    let restr_schema = parse_schema (split_text schema) in
+    let parsed = parse_entry restr_schema (split_text entry) in
+    Entries.add_inc entries pos lemma parsed in
+  let rows = File.load_tab filename parse_row in
+  Xlist.fold rows Entries.empty add_row
+
+(* Loads the phrase table from a tab-separated file.
+   The first field of a row is the numeric phrase id, every following field
+   is one morf that is tokenised with split_text and parsed with parse_morf.
+   Returns an IntMap from id to the list of parsed morfs; a row without any
+   field raises Failure "load_phrases". *)
+let load_phrases filename =
+  let parse_row = function
+      id :: morfs -> int_of_string id, morfs
+    | [] -> failwith "load_phrases" in
+  let rows = File.load_tab filename parse_row in
+  Xlist.fold rows IntMap.empty (fun phrases (id,morfs) ->
+      let parsed = Xlist.map morfs (fun morf -> parse_morf (split_text morf)) in
+      IntMap.add phrases id parsed)
+
+(* Loads schemata from a tab-separated file.
+   Every row must have exactly seven fields: pos, lemma, opinion, negation,
+   predicativity, aspect and schema; otherwise Failure "load_schemata" is
+   raised.  The attribute fields are parsed in that order, the schema is
+   parsed with parse_simple_schema, and the resulting 5-tuple is accumulated
+   under (pos, lemma) with Entries.add_inc. *)
+let load_schemata filename =
+  let parse_row = function
+      [pos; lemma; opinion; neg; pred; aspect; schema] ->
+      pos, lemma, opinion, neg, pred, aspect, schema
+    | _ -> failwith "load_schemata" in
+  let add_row entries (pos,lemma,opinion,neg,pred,aspect,schema) =
+    (* Sequential lets keep the parse order fixed. *)
+    let opinion = parse_opinion opinion in
+    let neg = parse_negation [Text neg] in
+    let pred = parse_pred pred in
+    let aspect = parse_aspect [Text aspect] in
+    let schema = parse_simple_schema (split_text schema) in
+    Entries.add_inc entries pos lemma (opinion,neg,pred,aspect,schema) in
+  let rows = File.load_tab filename parse_row in
+  Xlist.fold rows Entries.empty add_row
+
+(* Tables read from the preprocessed dictionary files.  These are top-level
+   bindings, so the three files are loaded when this module is initialised;
+   the paths are relative (presumably to the working directory - confirm). *)
+let phrases = load_phrases "results/phrases.tab"
+let entries = load_entries "results/entries.tab"
+let schemata = load_schemata "results/schemata.tab"
  
+(*
 let print_subjs () =
 (*   let expands,compreps,comprep_reqs,subtypes,equivs = load_realizations () in *)
   let subjs = Xlist.fold Paths.walenty_filenames StringQMap.empty (fun subjs filename ->
@@ -560,18 +422,4 @@ let print_ctrls () =
       Printf.printf "%5d %s\n" v s)
  
 (* let _ = print_ctrls () *)
-
-(* Test parsowania *)
-(*let _ =
-  let expands,compreps,comprep_reqs,subtypes,equivs = load_realizations () in
-  Xlist.iter Paths.walenty_filenames (fun filename ->
-    print_endline filename;
-    let frames = load_frames (Paths.walenty_path ^ filename) in
-    StringMap.iter frames (fun _ l ->
-      Xlist.iter l (fun (refl,opinion,negation,pred,aspect,schema) ->
-(*       print_endline schema; *)
-        ignore (parse_opinion opinion);
-        ignore (parse_negation [Text negation]);
-        ignore (parse_pred [Text pred]);
-        ignore (parse_aspect [Text aspect]);
-        ignore (expand_equivs_schema equivs (expand_subtypes subtypes (expand_schema expands (parse_schema schema)))))))*)*)
+*)
@@ -17,31 +17,21 @@
  *  along with this program.  If not, see <http://www.gnu.org/licenses/>.
  *)
  
-open ENIAMwalTypes
+open ENIAMwalTypes2
 open Xstd
  
+(* Fills in the realizations of phrase abbreviations inside a morf.
+   - Advp "misc" and Advp "mod" with no realizations get the single
+     realization Phrase AdvP;
+   - any other abbreviation with no realizations is looked up in [expands];
+     a missing key raises Failure "expand_schema_morf";
+   - an abbreviation that already has realizations has each of them
+     expanded recursively;
+   - a LexPhrase has its nested schema expanded with expand_schema;
+   - every other morf is returned unchanged. *)
 let rec expand_schema_morf expands = function
-    PhraseAbbr(Advp "misc",[]) -> PhraseAbbr(Advp "misc",[])
-  | PhraseAbbr(Advp "mod",[]) -> PhraseAbbr(Advp "mod",[])
-  (* | PhraseAbbr(ComparP s,[]) -> PhraseAbbr(ComparP s,[Phrase(ComparNP(s,Str));Phrase(ComparPP(s))]) (* FIXME: albo do walTEI albo usunąć *) *)
+    PhraseAbbr(Advp "misc",[]) -> PhraseAbbr(Advp "misc",[Phrase AdvP])
+  | PhraseAbbr(Advp "mod",[]) -> PhraseAbbr(Advp "mod",[Phrase AdvP])
   | PhraseAbbr(abbr,[]) -> (try PhraseAbbr(abbr,AbbrMap.find expands abbr) with Not_found -> failwith "expand_schema_morf")
   | PhraseAbbr(abbr,morfs) -> PhraseAbbr(abbr,Xlist.map morfs (expand_schema_morf expands))
   | LexPhrase(pos_lex,(restr,schema)) -> LexPhrase(pos_lex,(restr,expand_schema expands schema))
-  (* | LexPhraseMode(mode,pos_lex,(restr,schema)) -> LexPhraseMode(mode,pos_lex,(restr,expand_schema expands schema)) *)
   | morf -> morf
  
+(* Applies expand_schema_morf to every morf of every position of [schema];
+   the other fields of each position are kept as they are. *)
 and expand_schema expands schema =
   Xlist.map schema (fun s ->
       {s with morfs=Xlist.map s.morfs (expand_schema_morf expands)})
  
-(* let get_mode = function
-    Xp(m) -> m
-  | Advp(m) -> m
-  (* | ComparP prep -> "compar" *)
-  | Nonch -> "nonch"
-  | Distrp -> "distrp"
-  | Possp -> "possp" *)
-
 let rec expand_subtypes_morf subtypes = function
     PhraseComp(comp_morf,(ctype,comps)) ->
       let comps = if comps = [] then (try CompMap.find subtypes ctype with Not_found -> failwith "expand_subtypes_schema") else comps in
@@ -50,18 +40,8 @@ let rec expand_subtypes_morf subtypes = function
         | Ncp case -> NCP(case,ctype,comp)
         | Prepncp(prep,case) -> PrepNCP(prep,case,ctype,comp)))
   | LexPhrase(pos_lex,(restr,schema)) -> [LexPhrase(pos_lex,(restr,expand_subtypes subtypes schema))]
-  (* | LexPhraseMode(mode,pos_lex,(restr,schema)) -> [LexPhraseMode(mode,pos_lex,(restr,expand_subtypes subtypes schema))] *)
   | PhraseAbbr(abbr,morfs) ->
-    (* let mode = get_mode abbr in *)
     List.flatten (Xlist.map morfs (expand_subtypes_morf subtypes))
-    (* Xlist.map morfs (function
-          Phrase p -> PhraseMode(mode,p)
-        | PhraseMode(_,p) -> PhraseMode(mode,p)
-        | LexPhrase(pos_lex,r) -> LexPhraseMode(mode,pos_lex,r)
-        | LexRPhrase(pos_lex,r) -> LexRPhraseMode(mode,pos_lex,r)
-        | LexPhraseMode(m,pos_lex,r) -> LexPhraseMode(mode,pos_lex,r)
-        | LexRPhraseMode(m,pos_lex,r) -> LexRPhraseMode(mode,pos_lex,r)
-        | _ -> failwith "expand_subtypes_morf") *)
   | E Null -> [E(NP(Str));E(NCP(Str,CompTypeUndef,CompUndef));E(CP(CompTypeUndef,CompUndef)); E(Or)]
   | morf -> [morf]
  
@@ -74,7 +54,6 @@ let expand_equivs_phrase equivs = function
   | PrepAdjP(prep,case) -> Xlist.map (try StringMap.find equivs prep with Not_found -> [prep]) (fun prep -> PrepAdjP(prep,case))
   | PrepNumP(prep,case) -> Xlist.map (try StringMap.find equivs prep with Not_found -> [prep]) (fun prep -> PrepNumP(prep,case))
   | ComprepNP(prep)  -> Xlist.map (try StringMap.find equivs prep with Not_found -> [prep]) (fun prep -> ComprepNP(prep))
-  (* | ComparNP(prep,case) -> Xlist.map (try StringMap.find equivs prep with Not_found -> [prep]) (fun prep -> ComparNP(prep,case)) *)
   | ComparP(prep)  -> Xlist.map (try StringMap.find equivs prep with Not_found -> [prep]) (fun prep -> ComparP(prep))
   | CP(ctype,Comp comp) -> Xlist.map (try StringMap.find equivs comp with Not_found -> [comp]) (fun comp -> CP(ctype,Comp comp))
   | NCP(case,ctype,Comp comp) -> Xlist.map (try StringMap.find equivs comp with Not_found -> [comp]) (fun comp -> NCP(case,ctype,Comp comp))
@@ -93,80 +72,27 @@ let rec expand_equivs_lex equivs = function
  
+(* Expands a morf into the list of its equivalent variants.
+   - Phrase and E: one morf for every phrase returned by
+     expand_equivs_phrase, rewrapped in the same constructor;
+   - LexPhrase: a single morf whose lexemes are expanded with
+     expand_equivs_lex and whose nested schema is expanded with
+     expand_equivs_schema;
+   - any other morf raises Failure with a message that includes the morf
+     rendered by ENIAMwalStringOf.morf. *)
 let rec expand_equivs_morf equivs = function
     Phrase phrase -> Xlist.map (expand_equivs_phrase equivs phrase) (fun phrase -> Phrase phrase)
-  (* | PhraseMode(mode,phrase) -> Xlist.map (expand_equivs_phrase equivs phrase) (fun phrase -> PhraseMode(mode,phrase)) *)
   | E phrase -> Xlist.map (expand_equivs_phrase equivs phrase) (fun phrase -> E phrase)
   | LexPhrase(pos_lex,(restr,schema)) -> [LexPhrase(Xlist.map pos_lex (fun (pos,lex) -> pos, expand_equivs_lex equivs lex),(restr,expand_equivs_schema equivs schema))]
-  (* | LexRPhrase(pos_lex,(restr,schema)) -> [LexRPhrase(Xlist.map pos_lex (fun (pos,lex) -> pos, expand_equivs_lex equivs lex),(restr,expand_equivs_schema equivs schema))]
-  | LexPhraseMode(mode,pos_lex,(restr,schema)) -> [LexPhraseMode(mode,Xlist.map pos_lex (fun (pos,lex) -> pos, expand_equivs_lex equivs lex),(restr,expand_equivs_schema equivs schema))]
-  | LexRPhraseMode(mode,pos_lex,(restr,schema)) -> [LexRPhraseMode(mode,Xlist.map pos_lex (fun (pos,lex) -> pos, expand_equivs_lex equivs lex),(restr,expand_equivs_schema equivs schema))] *)
-(* | PhraseAbbr(abbr,morfs) -> [PhraseAbbr(abbr,List.flatten (Xlist.map morfs (expand_equivs_morf equivs)))] *)
   | morf -> failwith ("expand_equivs_morf: " ^ ENIAMwalStringOf.morf morf)
  
+(* Replaces the morfs of every position of [schema] with the concatenation
+   of the variants produced by expand_equivs_morf for each of them. *)
 and expand_equivs_schema equivs schema =
   Xlist.map schema (fun s ->
     {s with morfs=List.flatten (Xlist.map s.morfs (expand_equivs_morf equivs))})
  
-
-let rec load_realizations_rec (expands,subtypes,equivs) found rev = function
-    [] -> if rev <> [] || found <> [] then failwith "load_realizations_rec" else expands,subtypes,equivs
-  | [Str.Text s; Str.Delim "-->"] :: l -> load_realizations_rec (expands,subtypes,equivs) ((s,rev) :: found) [] l
-  | [Str.Delim "    "; Str.Text s; Str.Delim "\t"; Str.Text t] :: l ->
-       load_realizations_rec (expands,subtypes,equivs) found ((s,t) :: rev) l
-  | [Str.Delim "    "; Str.Text s] :: l ->
-       load_realizations_rec (expands,subtypes,equivs) found ((s,"") :: rev) l
-  | [Str.Delim "% "; Str.Text "Phrase types expand:"] :: l -> load_realizations_rec (found,subtypes,equivs) [] rev l
-  | [Str.Delim "% "; Str.Text "Attributes subtypes:"] :: l -> load_realizations_rec (expands,found,equivs) [] rev l
-  | [Str.Delim "% "; Str.Text "Attributes equivalents:"] :: l -> load_realizations_rec (expands,subtypes,found) [] rev l
-(*   | [Str.Delim "% "; Str.Text s] :: l -> print_endline s; load_realizations_rec found rev l *)
-  | [] :: l -> load_realizations_rec (expands,subtypes,equivs) found rev l
-  | _ -> failwith "load_realizations_rec"
-
-(* let find_comprep_reqs compreps =
-  Xlist.fold compreps StringMap.empty (fun comprep_reqs (s,l) ->
-    let l = Xlist.map l (function
-        LexPhrase(pos_lex,_) -> Xlist.fold pos_lex StringSet.empty (fun set -> function
-            _,Lexeme s -> StringSet.add set s
-          | _ -> set)
-      (* | LexPhraseMode(_,pos_lex,_) -> Xlist.fold pos_lex StringSet.empty (fun set -> function
-            _,Lexeme s -> StringSet.add set s
-          | _ -> set) *)
-      | morf -> failwith ("find_compreps_reqs: " ^ ENIAMwalStringOf.morf morf)) in
-    if l = [] then failwith "find_compreps_reqs";
-    StringMap.add comprep_reqs s (StringSet.to_list (Xlist.fold (List.tl l) (List.hd l) StringSet.union))) *)
-
-(* let create_comprep_dict compreps =
-  Xlist.fold compreps StringMap.empty (fun compreps (s,l) ->
-    Xlist.fold l compreps (fun compreps -> function
-        LexPhrase([PREP _,_;SUBST _,lex],_) as morf ->
-          let lexemes = get_lexemes lex in
-          Xlist.fold lexemes compreps (fun compreps lexeme ->
-            StringMap.add_inc compreps lexeme ["subst",(s,morf)] (fun l -> ("subst",(s,morf)) :: l))
-      (* | LexPhraseMode("misc",[ADV grad,lex],restr) ->
-          let morf = LexPhrase([ADV grad,lex],restr) in
-          let lexemes = get_lexemes lex in
-          Xlist.fold lexemes compreps (fun compreps lexeme ->
-            StringMap.add_inc compreps lexeme ["adv",(s,morf)] (fun l -> ("adv",(s,morf)) :: l)) *)
-      | LexPhrase([PREP _,_;NUM _,_;SUBST _,lex],_) as morf ->
-          let lexemes = get_lexemes lex in
-          Xlist.fold lexemes compreps (fun compreps lexeme ->
-            StringMap.add_inc compreps lexeme ["subst",(s,morf)] (fun l -> ("subst",(s,morf)) :: l))
-      | morf -> failwith ("create_comprep_dict: " ^ ENIAMwalStringOf.morf morf))) *)
-
-let load_realizations () =
-  (* let lines = Str.split (Str.regexp "\n") (File.load_file realizations_filename) in
-  let lines = Xlist.rev_map lines (fun line -> Str.full_split (Str.regexp "% \\|-->\\|    \\|\t") line) in
-  let expands,subtypes,equivs = load_realizations_rec ([],[],[]) [] [] lines in *)
-  let subtypes = Xlist.fold ENIAMwalTEI.subtypes CompMap.empty (fun subtypes -> function
+(* UWAGA: aktualnie equivs nie są wstawiane do expands *)
+let load_realizations (expands,subtypes,equivs) =
+  let subtypes = Xlist.fold subtypes CompMap.empty (fun subtypes -> function
       "int",l -> CompMap.add subtypes Int (List.flatten (Xlist.map l (fun v -> snd(ENIAMwalTEI.parse_comp v))))
     | "rel",l -> CompMap.add subtypes Rel (List.flatten (Xlist.map l (fun v -> snd(ENIAMwalTEI.parse_comp v))))
     | _ -> failwith "load_realizations 1") in
-  let equivs = Xlist.fold ENIAMwalTEI.equivs StringMap.empty (fun equivs (k,l) -> StringMap.add equivs k (k :: l)) in
-  let expands,compreps = Xlist.fold ENIAMwalTEI.expands (AbbrMap.empty,[]) (fun (expands, compreps) (id,k,l) ->
+  let equivs = Xlist.fold equivs StringMap.empty (fun equivs (k,l) -> StringMap.add equivs k (k :: l)) in
+  let expands,compreps = Xlist.fold expands (AbbrMap.empty,[]) (fun (expands, compreps) (id,k,l) ->
     match k with
         PhraseAbbr(Advp m,[]) -> AbbrMap.add expands (Advp m) l, compreps
       | PhraseAbbr(Nonch,[]) -> AbbrMap.add expands Nonch l, compreps
       | PhraseAbbr(Xp m,[]) -> AbbrMap.add expands (Xp m) (List.flatten (Xlist.map l (function
-             PhraseAbbr(Advp m,[]) -> (try AbbrMap.find expands (Advp m) with Not_found -> [PhraseAbbr(Advp m,[])]) (* FIXME: zakładam, że advp się nie rozmnoży *)
+             PhraseAbbr(Advp m,[]) -> (try AbbrMap.find expands (Advp m) with Not_found -> [PhraseAbbr(Advp m,[])]) (* zakładam, że advp się nie rozmnoży *)
           | morf -> [morf]))), compreps
       | Phrase(ComprepNP s) -> expands, (s, l) :: compreps
       | PhraseAbbr(Distrp,[]) -> AbbrMap.add expands Distrp l, compreps
@@ -174,53 +100,4 @@ let load_realizations () =
       | _ -> failwith "load_realizations 2") in
   let compreps = Xlist.map compreps (fun (s,morfs) ->
     s, List.flatten (List.flatten (Xlist.map morfs (fun morf -> Xlist.map (expand_subtypes_morf subtypes (expand_schema_morf expands morf)) (expand_equivs_morf equivs))))) in
-  (* let comprep_reqs = find_comprep_reqs compreps in *)
-  (* let compreps = create_comprep_dict compreps in *)
-  expands,compreps,(*comprep_reqs,*)subtypes,equivs
-
-let expands,compreps,(*comprep_reqs,*)subtypes,equivs = load_realizations ()
-
-
-(* Wypisanie realizacji *)
-(* let _ =
-  Xlist.iter ENIAMwalTEI.expands (fun (id,morf,l) ->
-      Printf.printf "%d %s:\n" id (ENIAMwalStringOf.morf morf);
-      Xlist.iter l (fun morf -> Printf.printf "    %s\n" (ENIAMwalStringOf.morf morf))) *)
-
-(* Wypisanie realizacji po przetworzeniu *)
-(* let _ =
-  AbbrMap.iter expands (fun morf l ->
-      Printf.printf "%s:\n" (ENIAMwalStringOf.phrase_abbr morf);
-      Xlist.iter l (fun morf -> Printf.printf "    %s\n" (ENIAMwalStringOf.morf morf))) *)
-
-let has_realization = function
-    PhraseAbbr _ -> true
-  | PhraseComp _ -> true
-  | _ -> false
-
-(* Wypisanie fraz, które podlegają rozwijaniu *)
-(*let _ =
-  IntMap.iter ENIAMwalTEI.phrases (fun i morf ->
-      if has_realization morf then
-      Printf.printf "%4d %s\n" i (ENIAMwalStringOf.morf morf)) *)
-
-let phrases =
-  IntMap.map ENIAMwalTEI.phrases (fun morf ->
-      let morf = expand_schema_morf expands morf in
-      let morfs = expand_subtypes_morf subtypes morf in
-      let morf = List.flatten (Xlist.map morfs (expand_equivs_morf equivs)) in
-      morf)
-
-(* Wypisanie fraz, które podlegają rozwijaniu *)
-(* let _ =
-  IntMap.iter phrases (fun i morf ->
-      if has_realization morf then
-      Printf.printf "%4d %s\n" i (ENIAMwalStringOf.morf morf)) *)
-
-(* let test_phrases = [17088; 17133; 1642]
-let _ =
-  Xlist.iter test_phrases (fun i ->
-      let m1 = IntMap.find ENIAMwalTEI.phrases i in
-      let m2 = IntMap.find phrases i in
-      Printf.printf "%4d %s\n" i (ENIAMwalStringOf.morf m1);
-      Printf.printf "%4d %s\n" i (ENIAMwalStringOf.morf m2)) *)
+  expands,compreps,subtypes,equivs
+(*
+ *  ENIAMwalenty, an interface for Polish Valence Dictionary "Walenty".
+ *  Copyright (C) 2016 Wojciech Jaworski <wjaworski atSPAMfree mimuw dot edu dot pl>
+ *  Copyright (C) 2016 Institute of Computer Science Polish Academy of Sciences
+ *
+ *  This library is free software: you can redistribute it and/or modify
+ *  it under the terms of the GNU Lesser General Public License as published by
+ *  the Free Software Foundation, either version 3 of the License, or
+ *  (at your option) any later version.
+ *
+ *  This library is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU Lesser General Public License for more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ *)
+
+open ENIAMwalTypes
+open Xstd
+
+(* let rec assign_pro_args schema =
+  Xlist.map schema (fun s ->
+      let morfs = match s.morfs with
+          (E p) :: l -> E Pro :: (E p) :: l
+        | [LexPhrase _] as morfs -> morfs
+        | [Phrase(FixedP _)] as morfs -> morfs
+        | [Phrase(Lex _)] as morfs -> morfs
+        (*    | [Phrase Refl] as morfs -> morfs
+              | [Phrase Recip] as morfs -> morfs*)
+        | Phrase Null :: _ as morfs -> morfs
+        | Phrase Pro :: _ as morfs -> morfs
+        | morfs -> if s.gf <> SUBJ && s.cr = [] && s.ce = [] then (Phrase Null) :: morfs else (Phrase Pro) :: morfs in (* FIXME: ustalić czy są inne przypadki uzgodnienia *)
+      (*     let morfs = assign_pro_args_lex morfs in *) (* bez pro wewnątrz leksykalizacji *)
+      {s with morfs=morfs}) *)
+
+(*let assign_pro_args_lex morfs =
+  Xlist.map morfs (function
+      Lex(morf,specs,lex,restr) -> LexN(morf,specs,lex,assign_pro_args_restr restr)
+    | LexNum(morf,lex1,lex2,restr) -> LexNum(morf,lex1,lex2,assign_pro_args_restr restr)
+    | LexCompar(morf,l) -> LexCompar(morf,make_gfs_lex l)
+    | morf -> morf)
+
+  and assign_pro_args_restr = function
+    Natr -> Natr
+  | Ratr1 schema -> Ratr1(assign_pro_args schema)
+  | Atr1 schema -> Atr1(assign_pro_args schema)
+  | Ratr schema -> Ratr(assign_pro_args schema)
+  | Atr schema -> Atr(assign_pro_args schema)*)
+
+exception ImpossibleSchema
+
+(* Keeps a complementizer only when a lexeme that can realise it is a key of
+   [lexemes] (only key membership is tested).
+   [Zeby] is accepted when "żeby" or "że" is present, [Gdy] when "gdy" or
+   "gdyby" is present.
+   Raises [Not_found] when the required lexeme is missing and
+   [Failure "reduce_comp"] for [CompUndef].
+   The function is not recursive, so it is declared without [rec]. *)
+let reduce_comp lexemes = function
+    Comp s -> if StringMap.mem lexemes s then Comp s else raise Not_found
+  | Zeby -> if StringMap.mem lexemes "żeby" || StringMap.mem lexemes "że" then Zeby else raise Not_found
+  | Gdy -> if StringMap.mem lexemes "gdy" || StringMap.mem lexemes "gdyby" then Gdy else raise Not_found
+  | CompUndef -> failwith "reduce_comp"
+
+(* Returns [phrase] (with its complementizer passed through [reduce_comp]
+   where it has one) if every lexeme the phrase depends on is a key of
+   [lexemes]; raises [Not_found] otherwise.
+   For [ComprepNP] the required lexemes are looked up in [comprep_reqs];
+   a preposition missing from that map has no requirements.
+   Phrases that mention no lexeme are returned unchanged. *)
+let reduce_phrase comprep_reqs lexemes phrase =
+  let present lemma = StringMap.mem lexemes lemma in
+  let require ok = if not ok then raise Not_found in
+  match phrase with
+    PrepNP(key,_) | PrepAdjP(key,_) | ComparP key | FixedP key
+  | SimpleLexArg(key,_) | LexArg(_,key,_) ->
+    require (present key);
+    phrase
+  | ComprepNP prep ->
+    let reqs = try StringMap.find comprep_reqs prep with Not_found -> [] in
+    require (List.for_all present reqs);
+    phrase
+  | CP(ctype,comp) -> CP(ctype,reduce_comp lexemes comp)
+  | NCP(case,ctype,comp) ->
+    (* the correlate "to" is checked before the complementizer *)
+    require (present "to");
+    NCP(case,ctype,reduce_comp lexemes comp)
+  | PrepNCP(prep,case,ctype,comp) ->
+    require (present prep && present "to");
+    PrepNCP(prep,case,ctype,reduce_comp lexemes comp)
+  | _ -> phrase
+
+(* Applies [reduce_phrase] to every element of the list, keeping the results
+   in order and dropping the elements for which it raises [Not_found]. *)
+let rec reduce_morfs comprep_reqs lexemes = function
+    [] -> []
+  | morf :: rest ->
+    let kept = reduce_morfs comprep_reqs lexemes rest in
+    (try reduce_phrase comprep_reqs lexemes morf :: kept
+     with Not_found -> kept)
+
+(* Reduces the morfs of every position with [reduce_morfs]; positions that
+   end up with no morfs are silently removed from the result. *)
+let reduce_schema2 comprep_reqs lexemes schema =
+  let rec loop kept = function
+      [] -> List.rev kept
+    | s :: rest ->
+      (match reduce_morfs comprep_reqs lexemes s.morfs with
+         [] -> loop kept rest
+       | morfs -> loop ({s with morfs=morfs} :: kept) rest) in
+  loop [] schema
+
+(* Reduces the morfs of every position with [reduce_morfs].
+   Raises [ImpossibleSchema] as soon as a position is left with no morfs. *)
+let reduce_schema comprep_reqs lexemes schema =
+  let rec loop kept = function
+      [] -> List.rev kept
+    | s :: rest ->
+      (match reduce_morfs comprep_reqs lexemes s.morfs with
+         [] -> raise ImpossibleSchema
+       | morfs -> loop ({s with morfs=morfs} :: kept) rest) in
+  loop [] schema
+
+(* let reduce_schema_frame lexemes = function
+    Frame(atrs,schema) -> Frame(atrs,reduce_schema lexemes schema)
+  (*  | ComprepFrame(s,morfs) ->
+        let morfs = reduce_morfs lexemes morfs in
+        if morfs = [] then raise ImpossibleSchema else ComprepFrame(s,morfs)*)
+  | _ -> failwith "reduce_schema_frame" *)
+
+
+(* For every value of the outer map [entries] (itself a map keyed by lemma),
+   builds a new map containing only the lemmas that belong to the set
+   [lexemes]. *)
+let reduce_entries lexemes entries =
+  let restrict lemma_map =
+    StringSet.fold lexemes StringMap.empty (fun kept lemma ->
+        let found =
+          try Some (StringMap.find lemma_map lemma)
+          with Not_found -> None in
+        match found with
+          Some frames -> StringMap.add kept lemma frames
+        | None -> kept) in
+  StringMap.map entries restrict
@@ -17,26 +17,7 @@
  *  along with this program.  If not, see <http://www.gnu.org/licenses/>.
  *)
  
-open ENIAMwalTypes
-
-(*let rec token = function
-    Text s -> s
-  | Paren l -> "(" ^ String.concat "" (Xlist.map l token) ^ ")"
-  | Bracet l -> "{" ^ String.concat "" (Xlist.map l token) ^ "}"
-  | SqBra l -> "[" ^ String.concat "" (Xlist.map l token) ^ "]"
-  | LParen -> "("
-  | RParen -> ")"
-  | LBracet -> "{"
-  | RBracet -> "}"
-  | LSqBra -> "["
-  | RSqBra -> "]"
-  | Semic -> ";"
-  | Plus -> "+"
-  | Comma -> ","
-  | Quot  -> "'"
-
-let token_list l =
-  String.concat "" (Xlist.map l token)*)
+open ENIAMwalTypes2
  
 let opinion = function
     Pewny -> "pewny"
@@ -87,10 +68,7 @@ let rec comp = function
 let rec comp_type = function
    Int -> "int"
  | Rel -> "rel"
- (* | Sub -> "sub"
- | Coord -> "coord" *)
  | CompTypeUndef -> "_"
- (* | CompTypeAgr -> "agr" *)
  
 let number = function
     Number s -> s
@@ -117,29 +95,16 @@ let acm = function
     Acm s -> s
   | AcmUndef -> "_"
  
-(* let sem = function
-    Sem -> "sem"
-  | NoSem -> "nosem" *)
-
-(*let req = function
-    Req -> ",req"
-  | NReq -> ",nreq"
-  | ReqUndef -> ""*)
-
 let gf = function
     SUBJ -> "subj"
   | OBJ -> "obj"
   | ARG -> "arg"(*""*)
-  (* | CORE -> "core"
-  | NOSEM -> "nosem"
-  | NOGF -> "nogf"
-  | ADJUNCT -> "adjunct"
-  | RAISED -> "raised"
-  | CLAUSE -> "clause"
-  | SENTENCE -> "sentence" *)
  
 let pos = function
     SUBST(n,c) -> "SUBST(" ^ number n ^ "," ^ case c ^ ")"
+  | PPRON12(n,c) -> "PPRON12(" ^ number n ^ "," ^ case c ^ ")"
+  | PPRON3(n,c) -> "PPRON3(" ^ number n ^ "," ^ case c ^ ")"
+  | SIEBIE(c) -> "SIEBIE(" ^ case c ^ ")"
   | PREP(c) -> "PREP(" ^ case c ^ ")"
   | NUM(c,g,a) -> "NUM(" ^ case c ^ "," ^ gender g ^ "," ^ acm a ^ ")"
   | ADJ(n,c,g,gr) -> "ADJ(" ^ number n ^ "," ^ case c ^ "," ^ gender g ^ "," ^ grad gr ^ ")"
@@ -162,7 +127,6 @@ let phrase = function
   | NumP(c) -> "nump(" ^ case c ^ ")"
   | PrepNumP(prep,c) -> "prepnump(" ^ prep ^ "," ^ case c ^ ")"
   | ComprepNP(prep) -> "comprepnp(" ^ prep ^ ")"
-  (* | ComparNP(prep,c) -> "comparnp(" ^ prep ^ "," ^ case c ^ ")" *)
   | ComparP(prep) -> "comparp(" ^ prep ^ ")"
   | CP(ct,co) -> "cp(" ^ comp_type ct ^ "," ^ comp co ^ ")"
   | NCP(c,ct,co) -> "ncp(" ^ case c ^ "," ^ comp_type ct ^ "," ^ comp co ^ ")"
@@ -172,11 +136,9 @@ let phrase = function
   | FixedP s -> "fixed(" ^ s ^ ")"
   | Num(c,a) -> "num(" ^ case c ^ "," ^ acm a ^ ")"
   | Or -> "or"
-  | Refl -> "refl"
-  | Recip -> "recip"
   | Qub -> "qub"
-  | Pro -> "pro"
-  | ProNG -> "prong"
+  (* | Pro -> "pro"
+  | ProNG -> "prong" *)
   | Null -> "null"
   | GerP c -> "gerp(" ^ case c ^ ")"
   | PrepGerP(prep,c) -> "prepgerp(" ^ prep ^ "," ^ case c ^ ")"
@@ -188,7 +150,6 @@ let phrase = function
 let phrase_abbr = function
     Xp(m) -> "xp(" ^ m ^ ")"
   | Advp(m) -> "advp(" ^ m ^ ")"
-  (* | ComparP prep -> "compar(" ^ prep ^ ")" *)
   | Nonch -> "nonch"
   | Distrp -> "distrp"
   | Possp -> "possp"
@@ -212,13 +173,7 @@ let restr = function
   | Ratrs -> "ratrs"
   | Atr1 -> "atr1"
   | Ratr1 -> "ratr1"
-(*  | Ratr1,s -> "ratr1(" ^ schema s ^ ")"
-  | Atr1,s -> "atr1(" ^ schema s ^ ")"
-  | Ratr,s -> "ratr(" ^ schema s ^ ")"
-  | Atr,s -> "atr(" ^ schema s ^ ")"
-  | Ratrs,s -> "ratrs(" ^ schema s ^ ")"
- *) | NoRestr -> ""
-(*   | NoRestr,s -> schema s *)
+  | NoRestr -> ""
  
 let controllers l =
   Xlist.map l (function
@@ -230,42 +185,10 @@ let controllees l =
       "1" -> "controllee"
     | n -> "controllee" ^ n)
  
-(*let lex_specs = function
-    NSpecs num -> number num
-  | AdvSpecs gr -> grad gr
-  | AdjSpecs(num,g,gr) -> number num ^ "," ^ gender g ^ "," ^ grad gr
-  | PpasSpecs(num,g,neg) -> number num ^ "," ^ gender g ^ "," ^ negation neg
-  | PactSpecs(num,g,neg,r) -> number num ^ "," ^ gender g ^ "," ^ negation neg ^ "," ^ refl r
-  | GerSpecs(num,neg,r) -> number num ^ "," ^ negation neg ^ "," ^ refl r
-  | CSpecs(neg,r) -> negation neg ^ "," ^ refl r
-  | NumSpecs g -> gender g
-  | EmptySpecs -> ""*)
-
-let mood = function
-    (*Mood*) s -> s
-  (*| MoodUndef -> "_"*)
-
-let tense t = t
-
-let aux = function
-    NoAux -> "-"
-  | PastAux -> "aux-past"
-  | FutAux -> "aux-fut"
-  | ImpAux -> "aux-imp"
-
-let nsem = function
-    Common s -> s
-  | Time -> "time"
-
-(* let direction = function
-    Forward -> "/"
-  | Backward  -> "\\"
-  | Both -> "|" *)
-
 let rec schema schema =
   String.concat "+" (Xlist.map schema (fun s ->
     String.concat "," (
-      (if s.gf = ARG then [] else [gf s.gf])@
+      (if s.gf = ARG then [] else [gf s.gf])@s.mode@
       (if s.role = "" then [] else [s.role])@
       (if s.role_attr = "" then [] else [s.role_attr])@
       (*s.sel_prefs@*)(controllers s.cr)@(controllees s.ce)) ^ "{" ^  String.concat ";" (Xlist.map s.morfs morf) ^ "}"))
@@ -276,82 +199,38 @@ let rec schema schema =
  
 and morf = function
     Phrase p -> phrase p
-  (* | PhraseMode(m,p) -> m ^ ":" ^ phrase p *)
   | E p -> "E(" ^ phrase p ^ ")"
   | LexPhrase(pos_lex,(r,s)) -> "lex([" ^ String.concat ";" (Xlist.map pos_lex (fun (p,le) -> pos p ^ "," ^ lex le)) ^ "]," ^ restr r ^ "[" ^ schema s ^ "])"
-  (* | LexRPhrase(pos_lex,(r,s)) -> "lex([" ^ String.concat ";" (Xlist.map pos_lex (fun (p,le) -> pos p ^ "," ^ lex le)) ^ "]," ^ restr r ^ "[" ^ schema s ^ "])" *)
-  (* | LexPhraseMode(m,pos_lex,(r,s)) -> "lex([" ^ m ^ "," ^ String.concat ";" (Xlist.map pos_lex (fun (p,le) -> pos p ^ "," ^ lex le)) ^ "]," ^ restr r ^ "[" ^ schema s ^ "])" *)
-  (* | LexRPhraseMode(m,pos_lex,(r,s)) -> "lex([" ^ m ^ "," ^ String.concat ";" (Xlist.map pos_lex (fun (p,le) -> pos p ^ "," ^ lex le)) ^ "]," ^ restr r ^ "[" ^ schema s ^ "])" *)
   | PhraseAbbr(p,ml) -> phrase_abbr p ^ "[" ^ String.concat ";" (Xlist.map ml morf) ^ "]"
   | PhraseComp(p,(ct,l)) -> phrase_comp p ^ "," ^ comp_type ct ^ "[" ^ String.concat ";" (Xlist.map l comp) ^ "]"
-  (* | LexPhraseId(id,p,le) -> "lex(" ^ id ^ "," ^ pos p ^ "," ^ lex le ^ ")"
-  | LexArg(id,p,le) -> "lex(" ^ id ^ "," ^ pos p ^ "," ^ le ^ ")" *)
-  (* | LexPhraseId(id,p,le) -> "lex(" ^ id ^ "," ^ pos p ^ "," ^ lex le ^ ")" *)
   | MorfId id -> Printf.sprintf "id(%d)" id
   | SimpleLexArg(le,p) -> "lex(" ^ le ^ "," ^ pos p ^ ")"
   | LexArg(id,le,p) -> "lex(" ^ string_of_int id ^ "," ^ le ^ "," ^ pos p ^ ")"
-(*  | LexRealization(mrf,le) -> "lex(" ^ morf mrf ^ "," ^ le ^ ")"*)
-  (* | Raised(mrf1,dir,mrf2) -> "raised([" ^ String.concat ";" mrf1 ^ "]," ^ direction dir ^ "[" ^ String.concat ";" mrf2 ^ "])"
-  | Multi l -> "multi(" ^ String.concat ";" (Xlist.map l phrase) ^ ")" *)
-
-(*and mode = function
-    Mode(s,[]) -> s
-  | Mode(s,l) -> s ^ "[" ^ "..."(*String.concat ";" (Xlist.map l morf)*) ^ "]"
-(*   | Mod l -> "mod[...]"  *)
-  | Pron [] -> "pron"
-  | Pron l -> "pron" ^ "[" ^ "..."(*String.concat ";" (Xlist.map l morf)*) ^ "]"
-  | Misc -> "misc"*)
-
-let meaning m =
-  m.name ^ "-" ^ m.variant
  
-let frame_atrs = function
-    DefaultAtrs(m,r,o,neg,p,a) -> Printf.sprintf "%s: %s: %s: %s: %s: %s" (String.concat "; " (Xlist.map m meaning)) (refl r) (opinion o) (negation neg) (pred p) (aspect a)
-  | EmptyAtrs m -> Printf.sprintf "%s" (String.concat "; " (Xlist.map m meaning))
-  | NounAtrs(m,nsyn,s(*,typ*)) -> Printf.sprintf "%s: %s: %s" (String.concat "; " (Xlist.map m meaning)) nsyn (nsem s) (*(String.concat ";" typ)*)
-  | AdjAtrs(m,c,adjsyn(*,adjsem,typ*)) -> Printf.sprintf "%s: %s: %s" (String.concat "; " (Xlist.map m meaning)) (case c) adjsyn (*adjsem (String.concat ";" typ)*)
-  | PersAtrs(m,le,neg,mo,t,au,a) -> Printf.sprintf "%s: %s: %s: %s: %s: %s: %s" (String.concat "; " (Xlist.map m meaning)) le (negation neg) (mood mo) (tense t) (aux au) (aspect a)
-  | GerAtrs(m,le,neg,a) -> Printf.sprintf "%s: %s: %s: %s" (String.concat "; " (Xlist.map m meaning)) le (negation neg) (aspect a)
-  | NonPersAtrs(m,le,role,role_attr,neg,a) -> Printf.sprintf "%s: %s: %s,%s: %s: %s" (String.concat "; " (Xlist.map m meaning)) le role role_attr (negation neg) (aspect a)
-  | _ -> failwith "WalStringOf.frame_atrs"
+(* Renders a [MorfId] as its bare decimal identifier; any other morf is
+   rejected with [Failure "ENIAMwalStringOf.simple_morf"]. *)
+let simple_morf morf =
+  match morf with
+    MorfId id -> string_of_int id
+  | _ -> failwith "ENIAMwalStringOf.simple_morf"
  
-let frame lexeme = function
-    Frame(atrs,s) ->
-      Printf.sprintf "%s: %s: %s" lexeme (frame_atrs atrs) (schema s)
-  | SimpleLexEntry(le,p) ->
-      Printf.sprintf "%s: %s" le p
-  | LexEntry(id,le,p,r,s) ->
-    Printf.sprintf "%d: %s: %s: %s: %s" id le p (restr r) (schema s)
-  | ComprepNPEntry(le,r,s) ->
-      Printf.sprintf "%s: %s: %s" le (restr r) (schema s)
-  (* | LexFrame(id,p,r,s) ->
-    Printf.sprintf "%s: %s: %s: %s: %s" lexeme id (pos p) (restr r) (schema s)
-  | ComprepFrame(le,p,r,s) ->
-    Printf.sprintf "%s: %s: %s: %s: %s" lexeme le (pos p) (restr r) (schema s) *)
-(*  | FrameR(atrs,s) ->
-      Printf.sprintf "%s: %s: %s" lexeme (frame_atrs atrs) (schema_role s)
-  | LexFrameR(id,p,r,s) ->
-      Printf.sprintf "%s: %s: %s: %s: %s" lexeme id (pos p) (restr r) (schema_role s)
-  | ComprepFrameR(le,p,r,s) ->
-      Printf.sprintf "%s: %s: %s: %s: %s" lexeme le (pos p) (restr r) (schema_role s)*)
-(*   | _ -> failwith "WalStringOf.frame" *)
+(* Prints a schema as its positions joined with "+".
+   Each position is the comma-separated list of its grammatical function
+   (omitted for [ARG]), modes, controllers and controllees, followed by the
+   ";"-separated [simple_morf] forms of its morfs in braces.
+   Fails (through [simple_morf]) when a morf is not a [MorfId].
+   The function is not recursive, so it is declared without [rec]. *)
+let simple_schema schema =
+  String.concat "+" (Xlist.map schema (fun s ->
+      String.concat "," (
+        (if s.gf = ARG then [] else [gf s.gf])@
+        s.mode@(controllers s.cr)@(controllees s.ce)) ^
+      "{" ^  String.concat ";" (Xlist.map s.morfs simple_morf) ^ "}"))
  
-let entry = function
-    Frame(atrs,s) ->
-    Printf.sprintf "%s: %s: %s" "lexeme" (frame_atrs atrs) (schema s)
-  | SimpleLexEntry(le,p) ->
-    Printf.sprintf "%s: %s" le p
-  | LexEntry(id,le,p,r,s) ->
-    Printf.sprintf "%d: %s: %s: %s: %s" id le p (restr r) (schema s)
-  | ComprepNPEntry(le,r,s) ->
-    Printf.sprintf "%s: %s: %s" le (restr r) (schema s)
  
-(* let fnum_frame lexeme = function
-    fnum,Frame(atrs,s) ->
-      Printf.sprintf "%d: %s: %s: %s" fnum lexeme (frame_atrs atrs) (schema s)
-  | fnum,LexFrame(id,p,r,s) ->
-      Printf.sprintf "%d: %s: %s: %s: %s: %s" fnum lexeme id (pos p) (restr r) (schema s)
-  | fnum,ComprepFrame(le,p,r,s) ->
-      Printf.sprintf "%d: %s: %s: %s: %s: %s" fnum lexeme le (pos p) (restr r) (schema s) *)
+(* Prints a meaning as "<name>-<variant>". *)
+let meaning m =
+  String.concat "-" [m.name; m.variant]
  
-let unparsed_frame lexeme (r,o,neg,p,a,s) = lexeme ^ " " ^ String.concat ": " [r;o;neg;p;a;s]
+(* Prints a lexical entry. For [LexEntry] and [ComprepNPEntry] the head is
+   followed by a tab and either the schema (when the restriction is
+   [NoRestr]) or the restriction (when the schema is empty); any other
+   combination raises [Failure "ENIAMwalStringOf.lex_entry"]. *)
+let lex_entry entry =
+  let modification = function
+      NoRestr, s -> schema s
+    | r, [] -> restr r
+    | _ -> failwith "ENIAMwalStringOf.lex_entry" in
+  match entry with
+    SimpleLexEntry(le,p) ->
+    Printf.sprintf "lex(%s,%s)" le p
+  | LexEntry(id,le,p,r,s) ->
+    Printf.sprintf "lex(%d,%s,%s)\t%s" id le p (modification (r,s))
+  | ComprepNPEntry(le,r,s) ->
+    Printf.sprintf "comprepnp(%s)\t%s" le (modification (r,s))
@@ -18,7 +18,7 @@
  *  along with this program.  If not, see <http://www.gnu.org/licenses/>.
  *)
  
-open ENIAMwalTypes
+open ENIAMwalTypes2
 open Xstd
  
 type id = {hash: bool; suffix: string; numbers: int list}
@@ -261,6 +261,10 @@ let rec process_lex lex = function
       (ENIAMwalStringOf.lex lemma) (ENIAMwalStringOf.lex numeral_lemma) in
     failwith ("process_lex: " ^ s)
  
+(* NOTE: refl_id may change between versions of Walenty *)
+let refl_id = 25
+let refl_position = {empty_position with role="Lemma"; mode=["lemma"]; morfs=[MorfId refl_id]} (* position whose only morf is the one identified by refl_id *)
+
 let rec load_category = function
   | F("category",Fs("category_def",x)) ->
     (match x with
@@ -321,7 +325,7 @@ and load_phrase mode = function
   | Fs("advp", [e;F("category",Symbol a)]) -> mode:=a :: !mode; PhraseAbbr(Advp(a),[])
   | Fs("nonch", []) -> mode:="nonch" :: !mode; PhraseAbbr(Nonch,[])
   | Fs("or", []) -> Phrase Or
-  | Fs("refl", []) -> Phrase Refl
+  | Fs("refl", []) -> mode:="refl" :: !mode; LexPhrase([QUB,Lexeme "się"],(Natr,[]))
   | Fs("E", []) -> E Null
   | Fs("lex", x) ->
     let lex = Xlist.fold x empty_lex load_lex in
@@ -330,7 +334,7 @@ and load_phrase mode = function
   | Fs("fixed", [F("argument",a);F("string",TEIstring b)]) -> Phrase (FixedP((*snd (load_phrase a),*)b))
   | Fs("possp", [e]) -> mode:="possp" :: !mode; PhraseAbbr(Possp,[])
   | Fs("possp", []) -> mode:="possp" :: !mode; PhraseAbbr(Possp,[])
-  | Fs("recip", []) -> Phrase Recip
+  | Fs("recip", []) -> mode:="recip" :: !mode; LexPhrase([QUB,Lexeme "się"],(Natr,[]))
   | Fs("distrp", [e]) -> mode:="distrp" :: !mode; PhraseAbbr(Distrp,[])
   | Fs("distrp", []) -> mode:="distrp" :: !mode; PhraseAbbr(Distrp,[])
   | Fs("compar", [F("compar_category",Symbol value)]) -> Phrase(ComparP value)
@@ -395,8 +399,7 @@ let parse_opinion = function
  
 let load_schema_info ent phrases (arg:schema) = function
   | F("opinion",Symbol opinion_value) -> {arg with opinion = parse_opinion opinion_value}
-  | F("inherent_sie",Binary true) -> {arg with reflexiveMark = ReflTrue}
-  | F("inherent_sie",Binary false) -> {arg with reflexiveMark = ReflFalse}
+  | F("inherent_sie",Binary b) -> {arg with reflexiveMark = b}
   | F("aspect",Symbol aspect_value) -> {arg with aspect = parse_aspect aspect_value}
   | Fset("aspect", []) -> arg
   | F("negativity",Symbol negativity_value) -> {arg with negativity = parse_negation negativity_value}
@@ -411,7 +414,7 @@ let load_schema_info ent phrases (arg:schema) = function
  
 let load_schema ent phrases = function
     Fs("schema", schema) ->
-    let result = {sch_id = (-1); opinion = OpinionUndef; reflexiveMark = ReflUndef; aspect = AspectUndef;
+    let result = {sch_id = (-1); opinion = OpinionUndef; reflexiveMark = false; aspect = AspectUndef;
                   negativity = NegationUndef; predicativity = PredUndef; positions = []; text_rep=""} in
     let result = Xlist.fold schema result (load_schema_info ent phrases) in
     result
@@ -587,22 +590,6 @@ let load_rentry = function
     id,morf,expansions
   | xml -> failwith ("load_entry: \n" ^ Xml.to_string_fmt xml)
  
-let load_expands filename =
-  begin
-    match Xml.parse_file filename with
-      Xml.Element("TEI", _,
-                  [Xml.Element("teiHeader",_,_) ;
-                   Xml.Element("text",[],[Xml.Element("body",[],entries)])]) ->
-      List.rev (Xlist.rev_map entries load_rentry)
-    | _ -> failwith "load_walenty"
-  end
-
-
-   (*let walenty = load_walenty Paths.walenty_filename *)
-let walenty,phrases = load_walenty "/home/yacheu/Dokumenty/NLP resources/Walenty/walenty_20170311.xml"
-
-(* let _ = Printf.printf "|phrases|=%d\n" (IntMap.size phrases) *)
-
 let expands_supplement = [
   (-2), PhraseAbbr(Nonch,[]), [
     LexPhrase([SUBST(NumberUndef,Str),Lexeme "co"],(Natr,[]));
@@ -615,7 +602,15 @@ let expands_supplement = [
     LexPhrase([ADV (Grad "pos"),Lexeme "jak"],(Natr,[]))
     ]]
  
-let expands = expands_supplement @ load_expands "/home/yacheu/Dokumenty/NLP resources/Walenty/phrase_types_expand_20170311.xml"
+(* Parses the TEI file [filename] and returns [expands_supplement] followed
+   by the result of [load_rentry] for each element of the document body.
+   Raises [Failure "load_expands"] when the document does not consist of a
+   TEI element holding exactly a teiHeader and a text/body pair. *)
+let load_expands filename =
+  match Xml.parse_file filename with
+    Xml.Element("TEI", _,
+                [Xml.Element("teiHeader",_,_) ;
+                 Xml.Element("text",[],[Xml.Element("body",[],entries)])]) ->
+    expands_supplement @ List.rev (Xlist.rev_map entries load_rentry)
+  | _ -> failwith "load_expands"
  
 let subtypes = [
   "int",[
@@ -42,6 +42,9 @@ type gf = SUBJ | OBJ | ARG
  
 type pos =
     SUBST of number * case
+  | PPRON12 of number * case
+  | PPRON3 of number * case
+  | SIEBIE of case
   | PREP of case
   | NUM of case * gender * acm
   | ADJ of number * case * gender * grad
@@ -84,39 +87,13 @@ type phrase =
   | PpasP of case
   | PrepPpasP of string * case
   | PactP of case
-
-type phrase_abbr =
-    Xp of string
-  | Advp of string
-  | Nonch
-  | Distrp
-  | Possp
-
-type phrase_comp =
-    Cp
-  | Ncp of case
-  | Prepncp of string * case
-
-type lex =
-    Lexeme of string
-  | ORconcat of lex list
-  | ORcoord of lex list
-  | XOR of lex list
-  | Elexeme of gender
+  | SimpleLexArg of string * pos
+  | LexArg of int * string * pos
+  | E of phrase
+  | MorfId of int
  
 type restr = Natr | Ratr | Ratrs | Ratr1 | Atr | Atr1 | NoRestr
  
-(*type lex_specs =
-    NSpecs of number
-  | AdvSpecs of grad
-  | AdjSpecs of number * gender * grad
-  | PpasSpecs of number * gender * negation
-  | PactSpecs of number * gender * negation * refl
-  | GerSpecs of number * negation * refl
-  | CSpecs of negation * refl
-  | NumSpecs of gender
-  | EmptySpecs *)
-
 type sel_prefs =
     SynsetId of int
   | Predef of string
@@ -124,49 +101,11 @@ type sel_prefs =
   | RelationRole of string * string * string (* relacji * rola * atrybut roli *)
  
 type position = {psn_id: int; gf: gf; role: string; role_attr: string; sel_prefs: sel_prefs list;
-                 mode: string list; cr: string list; ce: string list; morfs: morf list}
-
-and morf =
-    Phrase of phrase
-  (* | PhraseMode of string * phrase *)
-  | E of phrase
-  | LexPhrase of (pos * lex) list * (restr * position list)
-  (* | LexRPhrase of (pos * lex) list * (restr * position list) *)
-  (* | LexPhraseMode of string * (pos * lex) list * (restr * position list) *)
-  (* | LexRPhraseMode of string * (pos * lex) list * (restr * position list) *)
-  | PhraseAbbr of phrase_abbr * morf list
-  | PhraseComp of phrase_comp * (comp_type * comp list)
-  (* | LexPhraseId of string * pos * lex
-  | LexArg of string * pos * string *)
-  | MorfId of int
-(*  | LexRealization of morf * string*)
-(*  | Raised of string list * direction * string list
-    | Multi of phrase list*)
-  | SimpleLexArg of string * pos
-  | LexArg of int * string * pos
+                 mode: string list; cr: string list; ce: string list; morfs: phrase list}
  
 let empty_position =
   {psn_id=(-1); gf=ARG; role=""; role_attr=""; mode=[]; sel_prefs=[]; cr=[]; ce=[]; morfs=[]}
  
-type lex_record = {
-  lex_argument: morf;
-  lex_arguments: morf list;
-  lex_lemma: lex;
-  lex_numeral_lemma: lex;
-  lex_mode: string list;
-  lex_negation: negation;
-  lex_degree: grad;
-  lex_number: number;
-  lex_reflex: refl;
-  lex_gender: gender;
-  lex_modification: restr * position list;
-}
-
-let empty_lex = {lex_argument=Phrase Null; lex_arguments=[]; lex_lemma=Lexeme "";
-                 lex_numeral_lemma=Lexeme ""; lex_mode=[]; lex_negation=NegationUndef;
-                 lex_degree=GradUndef; lex_number=NumberUndef; lex_reflex=ReflUndef;
-                 lex_gender=GenderUndef; lex_modification = Natr,[]}
-
 type meaning = {mng_id: int;
                 name: string;
                 variant: string;
@@ -211,21 +150,6 @@ end
  
 module EntrySet = Xset.Make(OrderedEntry)
  
-module OrderedAbbr = struct
-  type  t = phrase_abbr
-  let compare = compare
-end
-
-module AbbrMap = Xmap.Make(OrderedAbbr)
-
-module OrderedComp = struct
-  type  t = comp_type
-  let compare = compare
-end
-
-(* module MorfSet = Xset.Make(OrderedMorf) *)
-module CompMap = Xmap.Make(OrderedComp)
-
 let resource_path =
   try Sys.getenv "ENIAM_RESOURCE_PATH"
   with Not_found -> "/usr/share/eniam"
+(*
+ *  ENIAMwalenty, an interface for Polish Valence Dictionary "Walenty".
+ *  Copyright (C) 2016 Wojciech Jaworski <wjaworski atSPAMfree mimuw dot edu dot pl>
+ *  Copyright (C) 2016 Institute of Computer Science Polish Academy of Sciences
+ *
+ *  This library is free software: you can redistribute it and/or modify
+ *  it under the terms of the GNU Lesser General Public License as published by
+ *  the Free Software Foundation, either version 3 of the License, or
+ *  (at your option) any later version.
+ *
+ *  This library is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU Lesser General Public License for more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ *)
+
+open Xstd
+
+type opinion = Dobry | Pewny | Potoczny | Watpliwy | Archaiczny | Zly | Wulgarny | Domyslny | OpinionUndef
+type negation = Negation | Aff | NegationUndef | NegationNA
+type pred = PredTrue | PredFalse | PredUndef | PredNA
+type aspect = Aspect of string | AspectUndef | AspectNA
+type case = Case of string | Str | Part | CaseAgr | NomAgr | GenAgr | AllAgr | CaseUndef | AllUAgr | CaseUAgr
+type comp = Comp of string | Zeby | Gdy | CompUndef
+type comp_type = Int | Rel | CompTypeUndef
+type number = Number of string | NumberUndef | NumberAgr
+type gender = Gender of string | GenderUndef | GenderAgr | Genders of string list
+type grad = Grad of string | GradUndef
+type refl = ReflEmpty | ReflTrue | ReflFalse | ReflUndef
+type acm = Acm of string | AcmUndef
+
+type gf = SUBJ | OBJ | ARG
+
+type pos =
+    SUBST of number * case
+  | PPRON12 of number * case
+  | PPRON3 of number * case
+  | SIEBIE of case
+  | PREP of case
+  | NUM of case * gender * acm
+  | ADJ of number * case * gender * grad
+  | ADV of grad
+  | GER of number * case * gender * aspect * negation * refl
+  | PACT of number * case * gender * aspect * negation * refl
+  | PPAS of number * case * gender * aspect * negation
+  | INF of aspect * negation * refl
+  | QUB
+  | COMPAR
+  | COMP of comp_type
+  | PERS of (*number * gender * aspect * person * *)negation * refl
+  | FIXED
+
+type phrase =
+    NP of case
+  | PrepNP of string * case
+  | AdjP of case
+  | PrepAdjP of string * case
+  | NumP of case
+  | PrepNumP of string * case
+  | ComprepNP of string
+  | ComparP of string (** case*)
+  | CP of comp_type * comp
+  | NCP of case * comp_type * comp
+  | PrepNCP of string * case * comp_type * comp
+  | InfP of aspect
+  | AdvP
+  | FixedP of string
+  | Num of case * acm
+  | Or
+  | Qub
+  (* | Pro
+  | ProNG *)
+  | Null
+  | GerP of case
+  | PrepGerP of string * case
+  | PpasP of case
+  | PrepPpasP of string * case
+  | PactP of case
+
+type phrase_abbr =
+    Xp of string
+  | Advp of string
+  | Nonch
+  | Distrp
+  | Possp
+
+type phrase_comp =
+    Cp
+  | Ncp of case
+  | Prepncp of string * case
+
+type lex =
+    Lexeme of string
+  | ORconcat of lex list
+  | ORcoord of lex list
+  | XOR of lex list
+  | Elexeme of gender
+
+type restr = Natr | Ratr | Ratrs | Ratr1 | Atr | Atr1 | NoRestr
+
+type sel_prefs =
+    SynsetId of int
+  | Predef of string
+  | RelationArgId of string * int (* relation name * frame argument id *)
+  | RelationRole of string * string * string (* relation * role * role attribute *)
+
+type position = {psn_id: int; gf: gf; role: string; role_attr: string; sel_prefs: sel_prefs list;
+                 mode: string list; cr: string list; ce: string list; morfs: morf list}
+
+and morf =
+    Phrase of phrase
+  | E of phrase
+  | LexPhrase of (pos * lex) list * (restr * position list)
+  | PhraseAbbr of phrase_abbr * morf list
+  | PhraseComp of phrase_comp * (comp_type * comp list)
+  | MorfId of int
+  | SimpleLexArg of string * pos
+  | LexArg of int * string * pos
+
+let empty_position =
+  {psn_id=(-1); gf=ARG; role=""; role_attr=""; mode=[]; sel_prefs=[]; cr=[]; ce=[]; morfs=[]}
+
+type lex_record = {
+  lex_argument: morf;
+  lex_arguments: morf list;
+  lex_lemma: lex;
+  lex_numeral_lemma: lex;
+  lex_mode: string list;
+  lex_negation: negation;
+  lex_degree: grad;
+  lex_number: number;
+  lex_reflex: refl;
+  lex_gender: gender;
+  lex_modification: restr * position list;
+}
+
+let empty_lex = {lex_argument=Phrase Null; lex_arguments=[]; lex_lemma=Lexeme "";
+                 lex_numeral_lemma=Lexeme ""; lex_mode=[]; lex_negation=NegationUndef;
+                 lex_degree=GradUndef; lex_number=NumberUndef; lex_reflex=ReflUndef;
+                 lex_gender=GenderUndef; lex_modification = Natr,[]}
+
+type meaning = {mng_id: int;
+                name: string;
+                variant: string;
+                plwnluid: int;
+                gloss: string}
+
+let empty_meaning = {mng_id = (-1);
+                     name = "";
+                     variant = "";
+                     plwnluid = (-1);
+                     gloss = ""}
+
+type schema = {sch_id: int; opinion: opinion; reflexiveMark: bool; aspect: aspect;
+               negativity: negation; predicativity: pred; positions: position list; text_rep: string}
+
+type lex_entry =
+    SimpleLexEntry of string * string
+  | LexEntry of int * string * string * restr * position list
+  | ComprepNPEntry of string * restr * position list
+
+
+module OrderedEntry = struct
+  type  t = lex_entry
+  let compare = compare
+end
+
+module EntrySet = Xset.Make(OrderedEntry)
+
+module OrderedAbbr = struct
+  type  t = phrase_abbr
+  let compare = compare
+end
+
+module AbbrMap = Xmap.Make(OrderedAbbr)
+
+module OrderedComp = struct
+  type  t = comp_type
+  let compare = compare
+end
+
+module CompMap = Xmap.Make(OrderedComp)
+
+type example = {exm_id: int;
+                meaning: int;
+                phrases: (int * int * int) list;
+                sentence: string;
+                source: string;
+                opinion: opinion;
+                note: string}
+
+type argument = {arg_id: int;
+                 role: string;
+                 role_attribute: string;
+                 sel_prefs: sel_prefs list}
+
+type frame  = {frm_id: int;
+               opinion: string;
+               meanings: int list;
+               arguments: argument list}
+
+type connection = {argument: int;
+                   phrases: (int * int list) list}
+
+type alternation = {schema: int; frame: int; connections: connection list}
+
+type entry = {ent_id: int;
+              status: string;
+              form_orth: string;
+              form_pos: string;
+              schemata: schema list;
+              examples: example list;
+              frames: frame list;
+              meanings: meaning list;
+              alternations: alternation list}
+
+let empty_entry = {ent_id=(-1); status=""; form_orth=""; form_pos=""; schemata=[]; examples=[];
+                   frames=[]; meanings=[]; alternations=[]}
+(*
+ *  ENIAMwalenty, an interface for Polish Valence Dictionary "Walenty".
+ *  Copyright (C) 2016 Wojciech Jaworski <wjaworski atSPAMfree mimuw dot edu dot pl>
+ *  Copyright (C) 2016 Institute of Computer Science Polish Academy of Sciences
+ *
+ *  This library is free software: you can redistribute it and/or modify
+ *  it under the terms of the GNU Lesser General Public License as published by
+ *  the Free Software Foundation, either version 3 of the License, or
+ *  (at your option) any later version.
+ *
+ *  This library is distributed in the hope that it will be useful,
+ *  but WITHOUT ANY WARRANTY; without even the implied warranty of
+ *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ *  GNU Lesser General Public License for more details.
+ *
+ *  You should have received a copy of the GNU Lesser General Public License
+ *  along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ *)
+
+open Xstd
+
+let empty = StringMap.empty (* the empty two-level dictionary: pos -> lemma -> entry list *)
+
+(* Registers [entry] under [pos] and [lemma]. The inner map for [pos] is
+   created when missing; the entry list is updated with [StringMap.add_inc],
+   given [[entry]] as the initial value and a function that prepends
+   [entry] to an existing list. *)
+let add_inc pos_map pos lemma entry =
+  let lemmas =
+    try StringMap.find pos_map pos
+    with Not_found -> StringMap.empty in
+  StringMap.add pos_map pos
+    (StringMap.add_inc lemmas lemma [entry] (fun existing -> entry :: existing))
+
+(* Registers all of [entries] under [pos] and [lemma]. The inner map for
+   [pos] is created when missing; the entry list is updated with
+   [StringMap.add_inc], given [entries] as the initial value and a function
+   that puts [entries] in front of an existing list. *)
+let add_inc_list pos_map pos lemma entries =
+  let lemmas =
+    try StringMap.find pos_map pos
+    with Not_found -> StringMap.empty in
+  StringMap.add pos_map pos
+    (StringMap.add_inc lemmas lemma entries (fun existing -> entries @ existing))
+
+(* Replaces every entry list by the concatenation of the lists
+   [f pos lemma entry] computed for its entries (collected with
+   [Xlist.rev_map] before being flattened). *)
+let flatten_map pos_map f =
+  let expand pos lemma entries =
+    List.flatten (Xlist.rev_map entries (fun entry -> f pos lemma entry)) in
+  StringMap.mapi pos_map (fun pos lemma_map ->
+      StringMap.mapi lemma_map (expand pos))
+
+(* Replaces the value stored under each [pos] and [lemma] by
+   [f pos lemma entries]. *)
+let map2 pos_map f =
+  StringMap.mapi pos_map (fun pos lemma_map ->
+      let apply lemma entries = f pos lemma entries in
+      StringMap.mapi lemma_map apply)
+
+(* Calls [f pos lemma entry] for every entry stored in the dictionary. *)
+let iter pos_map f =
+  let visit_lemma pos lemma entries =
+    Xlist.iter entries (fun entry -> f pos lemma entry) in
+  StringMap.iter pos_map (fun pos lemma_map ->
+      StringMap.iter lemma_map (visit_lemma pos))
+
+(* Folds [f] over every entry of the dictionary, threading the accumulator
+   (initially [s]) through calls of the form [f acc pos lemma entry]. *)
+let fold pos_map s f =
+  let fold_entries pos lemma acc entries =
+    Xlist.fold entries acc (fun acc entry -> f acc pos lemma entry) in
+  let fold_lemmas acc pos lemma_map =
+    StringMap.fold lemma_map acc (fun acc lemma entries ->
+        fold_entries pos lemma acc entries) in
+  StringMap.fold pos_map s fold_lemmas
@@ -25,11 +25,12 @@ eniam-walenty.cma: $(SOURCES)
 eniam-walenty.cmxa: $(SOURCES)
 	ocamlopt -linkall -a -o eniam-walenty.cmxa $(INCLUDES) $^
  
-test: test.ml
-	$(OCAMLOPT) -o test $(OCAMLOPTFLAGS) test.ml
+test: entries.ml ENIAMwalTypes.ml ENIAMwalParser.ml ENIAMwalReduce.ml test.ml
+	$(OCAMLOPT) -o test $(OCAMLOPTFLAGS) entries.ml ENIAMwalTypes.ml ENIAMwalParser.ml ENIAMwalReduce.ml test.ml
  
-loader: ENIAMwalTypes.ml ENIAMwalStringOf.ml ENIAMwalTEI.ml ENIAMwalConnect.ml ENIAMwalRealizations.ml ENIAMwalLex.ml
-	$(OCAMLOPT) -o loader $(OCAMLOPTFLAGS) ENIAMwalTypes.ml ENIAMwalStringOf.ml ENIAMwalTEI.ml ENIAMwalConnect.ml ENIAMwalRealizations.ml ENIAMwalLex.ml
+loader: entries.ml ENIAMwalTypes2.ml ENIAMwalStringOf.ml ENIAMwalTEI.ml ENIAMwalConnect.ml ENIAMwalRealizations.ml ENIAMwalLex.ml ENIAMwalGenerate.ml
+	mkdir -p results
+	$(OCAMLOPT) -o loader $(OCAMLOPTFLAGS) entries.ml ENIAMwalTypes2.ml ENIAMwalStringOf.ml ENIAMwalTEI.ml ENIAMwalConnect.ml ENIAMwalRealizations.ml ENIAMwalLex.ml ENIAMwalGenerate.ml
  
 .SUFFIXES: .mll .mly .ml .mli .cmo .cmi .cmx
  
@@ -18,7 +18,7 @@
  *)
  
 open Xstd
-
+(*
 let test_strings = [
   ["chłopiec","subst"; "maić","fin"; "ulica","subst"; "kwiat","subst"]
   ]
@@ -50,3 +50,4 @@ let _ =
     s := read_line ()
   done;*)
   ()
+*)