Analiza kontroli w Walentym

Wojciech Jaworski
1 parent d102eb5a
Showing 16 changed files with 94 additions and 260 deletions
LCGlexicon/ENIAMcategoriesPL.ml
LCGlexicon/TODO
LCGlexicon/resources/lexicon-pl.dic
lexSemantics/ENIAMlexSemantics.ml
lexSemantics/ENIAMlexSemanticsData.ml
lexSemantics/ENIAMvalence.ml
lexSemantics/ENIAMwalRenderer.ml
semantics/ENIAMsemGraph.ml
semantics/ENIAMsemLexicon.ml
semantics/ENIAMsemValence.ml
semantics/resources/lexicon-pl.dic
testy/testy_podstawowe.txt
walenty/.gitignore
walenty/ENIAMwalGenerate.ml
walenty/ENIAMwalTEI.ml
walenty/makefile
@@ -86,6 +86,7 @@ let subst_time_lexemes = ref StringSet.empty
  
 let subst_pronoun_lexemes = StringSet.of_list ["co"; "kto"; "cokolwiek"; "ktokolwiek"; "nic"; "nikt"; "coś"; "ktoś"; "to"]
 let adj_pronoun_lexemes = StringSet.of_list ["czyj"; "jaki"; "który"; "jakiś"; "ten"; "taki"]
+let compar_lexemes = StringSet.of_list ["jak"; "jako"; "niż"; "niczym"; "niby"; "co"; "zamiast"] (* Lemmas that clarify_categories retags from "prep" to pos="compar"; assign_prep_semantics also tests membership in this set *)
  
 (* let adj_quant_lexemes = StringSet.of_list ["każdy"; "wszelki"; "wszystek"; "żaden"; "jakiś"; "pewien"; "niektóry"; "jedyny"; "sam"] *)
  
@@ -200,12 +201,12 @@ let clarify_categories proper cat = function
       let cases = expand_cases cases in
       [{empty_cats with lemma=lemma; pos="siebie"; pos2="pron"; numbers=all_numbers; cases=cases; genders=all_genders; persons=["ter"]}]
   | lemma,"prep",[cases;woks] ->
-      if lemma = "jak" || lemma = "jako" || lemma = "niż" || lemma = "niczym" || lemma = "niby" || lemma = "co" || lemma = "zamiast" then
+      if StringSet.mem compar_lexemes lemma then
         [{empty_cats with lemma=lemma; pos="compar"; pos2="prep"}] else
       let cases = expand_cases cases in
       [{empty_cats with lemma=lemma; pos="prep"; pos2="prep"; cases=cases}]
   | lemma,"prep",[cases] ->
-      if lemma = "jak" || lemma = "jako" || lemma = "niż" || lemma = "niczym" || lemma = "niby" || lemma = "co" || lemma = "zamiast" then
+      if StringSet.mem compar_lexemes lemma then
         [{empty_cats with lemma=lemma; pos="compar"; pos2="prep"}] else
       let cases = expand_cases cases in
       [{empty_cats with lemma=lemma; pos="prep"; pos2="prep"; cases=cases}]
+- day-lex nie jest argumentem w żadnej regule
+
 - dodać uzgodnienie policzalności liczebnika i rzeczownika
  
 - dodać prepncp
@@ -105,7 +105,10 @@ lemma=jakiś|ten|taki,pos=apron:
  
 # liczebniki
 # FIXME: liczba po rzeczowniku  # FIXME: zbadać jak liczebniki współdziałają z jako COMPAR
-pos=num|intnum|realnum|intnum-interval|realnum-interval:
+# dwie reguły są potrzebne po to, żeby w ENIAMsemValence.match_value nie pojawiał się variant
+pos=num|intnum|realnum|intnum-interval|realnum-interval,nsem=count:
+  num*number*case*gender*person*acm*nsem{\(1+qub),/(1+inclusion)}; # FIXME: jak usunięcie Phrase ProNG wpływa na pokrycie?
+pos=num|intnum|realnum|intnum-interval|realnum-interval,nsem=mass:
   num*number*case*gender*person*acm*nsem{\(1+qub),/(1+inclusion)}; # FIXME: jak usunięcie Phrase ProNG wpływa na pokrycie?
  
 # pojemniki
@@ -138,7 +141,7 @@ lemma=w,pos=prep,case=loc:      prepnp*lemma*case{\(1+advp*T),/(day-month+day+ye
  
 # komparatywy
 # FIXME: trzeba poprawić comparnp i comparpp w walencji
-pos=compar: QUANT[case=nom&gen&dat&acc&inst] compar*lemma*case{\(1+advp*T),/np*T*case*T*T}{\(1+qub),/(1+inclusion)};
+pos=compar: QUANT[case=nom&gen&dat&acc&inst] compar*lemma*case{\(1+advp*T),/(np*T*case*T*T+adjp*T*case*T)}{\(1+qub),/(1+inclusion)};
 pos=compar: QUANT[case=postp] compar*lemma*case{\(1+advp*T),/(prepnp*T*T+prepadjp*T*T)}{\(1+qub),/(1+inclusion)};
  
 # frazy przymiotnikowe
@@ -205,6 +205,20 @@ let mark_nosem frame =
     else p))}
  
 let assign_prep_semantics lemma =
+  if StringSet.mem ENIAMcategoriesPL.compar_lexemes lemma then
+    [{empty_frame with
+      meanings = [find_prep_meaning lemma [Predef "ALL"]];
+      positions= [{empty_position with
+        dir=Forward_; gf=CORE;
+        morfs=ENIAMwalRenderer.compar_morfs; is_necessary=Req}];
+      agf="arg"};
+    {empty_frame with
+      meanings = [find_prep_meaning lemma [Predef "ALL"]];
+      positions= [{empty_position with
+        sel_prefs=[SynsetName "ALL"]; dir=Forward_; gf=CORE;
+        morfs=ENIAMwalRenderer.compar_morfs; is_necessary=Req}];
+      arole="Arg"; arole_attr=""; arev=false; agf="adjunct"}]
+  else
   let roles = try StringMap.find ENIAMlexSemanticsData.prep_roles lemma with Not_found -> [] in
   (* Printf.printf "assign_prep_semantics: |roles|=%d\n%!" (Xlist.size roles); *)
   {empty_frame with
@@ -213,6 +227,14 @@ let assign_prep_semantics lemma =
       dir=if lemma="temu" then Backward_ else Forward_; gf=CORE;
       morfs=ENIAMwalRenderer.prep_morfs; is_necessary=Req}];
     agf="arg"} ::
+  (if roles = [] then (* FIXME: zaślepka do usunięcia po stworzeniu listy przyimków *)
+  [{empty_frame with
+    meanings = [find_prep_meaning lemma [Predef "ALL"]];
+    positions= [{empty_position with
+      sel_prefs=[SynsetName "ALL"]; dir=if lemma="temu" then Backward_ else Forward_; gf=CORE;
+      morfs=ENIAMwalRenderer.prep_morfs; is_necessary=Req}];
+    arole="Arg"; arole_attr=""; arev=false; agf="adjunct"}]
+  else
   Xlist.map roles (function (case,arole,arole_attr,hipero,sel_prefs) ->
     (* Printf.printf "assign_prep_semantics: case=%s arole=%s arole_attr=%s\n%!" case arole arole_attr; *)
     let meaning = find_prep_meaning lemma hipero in (* FIXME: zaślepka dla meaning i weight *)
@@ -222,7 +244,7 @@ let assign_prep_semantics lemma =
       morfs=ENIAMwalRenderer.prep_morfs(*ENIAMwalRenderer.assing_prep_morfs (lemma,case)*); is_necessary=Req}] in
     (* print_endline "assign_prep_semantics 2"; *)
     {empty_frame with selectors=[ENIAM_LCGlexiconTypes.Case,ENIAM_LCGlexiconTypes.Eq,[case]]; meanings=[meaning]; positions=find_selprefs positions;
-     arole=arole; arole_attr=arole_attr; arev=false; agf="adjunct"})
+     arole=arole; arole_attr=arole_attr; arev=false; agf="adjunct"}))
  
 let assign_num_semantics lemma =
   let sems = try StringMap.find !num_sem lemma with Not_found -> [] in
@@ -369,7 +391,7 @@ let disambiguate_senses lex_sems group =
       Xlist.fold frame.positions prefs (fun prefs t ->
         Xlist.fold t.sel_prefs prefs (fun prefs -> function
           SynsetName s -> StringSet.add prefs s
-        | _ -> failwith "disambiguate_senses")))) in
+        | t -> failwith ("disambiguate_senses: " ^ ENIAMwalStringOf.sel_prefs t))))) in
   (*let hipero = Xlist.fold group (StringSet.singleton "ALL") (fun hipero id ->
     Xlist.fold (ExtArray.get lex_sems id).senses hipero (fun hipero (_,l,_) ->
       Xlist.fold l hipero StringSet.add)) in
@@ -267,19 +267,19 @@ let prep_roles = Xlist.fold [ (* lemma,case,role,role_attr,meaning/hipero,sel_pr
   "przed","acc",	"Location","Goal",["POŁOŻENIE"],["POŁOŻENIE"];
   "w","acc",		"Location","Goal",["POŁOŻENIE"],["POŁOŻENIE"];
   "za","acc",		"Location","Goal",["POŁOŻENIE"],["POŁOŻENIE"];
-  "dzięki","dat",	"Condition","",["CZEMU"],[];
-  "na","acc",		"Condition","",["CZEMU"],[];
-  "na","postp",		"Condition","",["CZEMU"],[];
-  "od","gen",		"Condition","",["CZEMU"],[];
-  "przez","acc",	"Condition","",["CZEMU"],[];
-  "wskutek","gen",	"Condition","",["CZEMU"],[];
-  "z","gen",		"Condition","",["CZEMU"],[];
-  "dla","gen",		"Purpose","",["CZEMU"],[];
-  "do","gen",		"Purpose","",["CZEMU"],[];
-  "ku","dat",		"Purpose","",["CZEMU"],[];
-  "na","acc",		"Purpose","",["CZEMU"],[];
-  "na","postp",		"Purpose","",["CZEMU"],[];
-  "po","acc",		"Purpose","",["CZEMU"],[];
+  "dzięki","dat",	"Condition","",["CZEMU"],["ALL"];
+  "na","acc",		"Condition","",["CZEMU"],["ALL"];
+  "na","postp",		"Condition","",["CZEMU"],["ALL"];
+  "od","gen",		"Condition","",["CZEMU"],["ALL"];
+  "przez","acc",	"Condition","",["CZEMU"],["ALL"];
+  "wskutek","gen",	"Condition","",["CZEMU"],["ALL"];
+  "z","gen",		"Condition","",["CZEMU"],["ALL"];
+  "dla","gen",		"Purpose","",["CZEMU"],["ALL"];
+  "do","gen",		"Purpose","",["CZEMU"],["ALL"];
+  "ku","dat",		"Purpose","",["CZEMU"],["ALL"];
+  "na","acc",		"Purpose","",["CZEMU"],["ALL"];
+  "na","postp",		"Purpose","",["CZEMU"],["ALL"];
+  "po","acc",		"Purpose","",["CZEMU"],["ALL"];
   "do","gen",		"Duration","",["CZAS"],["CZAS"];
   "od","gen",		"Duration","",["CZAS"],["CZAS"];
   "przez","acc",	"Duration","",["CZAS"],["CZAS"];
@@ -326,13 +326,13 @@ let prep_roles = Xlist.fold [ (* lemma,case,role,role_attr,meaning/hipero,sel_pr
   "wedle","gen",	"Location","",["POŁOŻENIE"],["POŁOŻENIE"];
   "wpośród","gen",	"Location","",["POŁOŻENIE"],["POŁOŻENIE"];
   "wśrzód","gen",	"Location","",["POŁOŻENIE"],["POŁOŻENIE"];
-  "po","postp",		"Manner","",["ALL"],[];
-  "bez","gen",		"Manner","",["ALL"],[];
+  "po","postp",		"Manner","",["ALL"],["ALL"];
+  "bez","gen",		"Manner","",["ALL"],["ALL"];
 (*  "jako","str",	"Manner","",[],[];
   "jak","str",		"Manner","",[],[];*)
-  "pod","acc",		"Manner","",["ALL"],[];
-  "z","inst",		"Manner","",["ALL"],[];
-  "z","postp",		"Manner","",["ALL"],[];
+  "pod","acc",		"Manner","",["ALL"],["ALL"];
+  "z","inst",		"Manner","",["ALL"],["ALL"];
+  "z","postp",		"Manner","",["ALL"],["ALL"];
   "dokoła","gen",	"Path","",["POŁOŻENIE"],["POŁOŻENIE"];
   "dookoła","gen",	"Path","",["POŁOŻENIE"],["POŁOŻENIE"];
   "koło","gen",		"Path","",["POŁOŻENIE"],["POŁOŻENIE"];
@@ -368,9 +368,10 @@ let prep_roles = Xlist.fold [ (* lemma,case,role,role_attr,meaning/hipero,sel_pr
   "w","loc",		"Time","",["CZAS"],["CZAS"];
   "temu","acc",		"Time","",["CZAS"],["CZAS"]; (* dodane *)
   "za","gen",		"Time","",["CZAS"],["CZAS"]; (* dodane *)
+  "o","acc",		"Arg","",["ALL"],["ALL"]; (* FIXME: zaślepka *)
   ] StringMap.empty (fun map (lemma,case,role,role_attr,hipero,sel_prefs) ->
       let hipero = Xlist.map hipero (fun hipero -> ENIAMwalTypes.Predef hipero) in
-      let sel_prefs = Xlist.map sel_prefs (fun sel_prefs -> ENIAMwalTypes.Predef sel_prefs) in
+      let sel_prefs = Xlist.map sel_prefs (fun sel_prefs -> ENIAMwalTypes.SynsetName sel_prefs) in
       StringMap.add_inc map lemma [case,role,role_attr,hipero,sel_prefs]
         (fun l -> (case,role,role_attr,hipero,sel_prefs) :: l))
 (*  "przeciwko","dat","Dat";
@@ -641,6 +641,7 @@ let get_aroles schema lemma = function
       | "perl" -> ([Mode,Eq,["perl"]],"Path","",false) :: l
       | "dur" -> ([Mode,Eq,["dur"]],"Duration","",false) :: l
       | "temp" -> ([Mode,Eq,["temp"]],"Time","",false) :: l
+      | "pron" -> ([Mode,Eq,["mod"]],"Manner","",false) :: l
       | _ -> failwith "get_aroles")
   | "qub" ->
       let l = try StringMap.find ENIAMlexSemanticsData.qub_roles lemma with Not_found -> ["Arg",""] in
@@ -363,3 +363,10 @@ let prep_morfs = [
   LCG(Tensor[Atom "day"]);
   LCG(Tensor[Atom "date"]);
   ]
+
+let compar_morfs = [ (* Morfs placed in the single position of the frames that assign_prep_semantics builds for compar_lexemes lemmas *)
+  LCG(Tensor[Atom "np"; Top; Atom "case"; Top; Top]); (* the four entries appear to mirror the argument types of the pos=compar lexicon rules: np and adjp carrying a case slot ... *)
+  LCG(Tensor[Atom "adjp"; Top; Atom "case"; Top]);
+  LCG(Tensor[Atom "prepnp"; Top; Top]); (* ... and prepnp / prepadjp with all remaining slots left as Top *)
+  LCG(Tensor[Atom "prepadjp"; Top; Top]);
+  ]
@@ -94,6 +94,8 @@ let create_normal_concept (*roles role_attrs*) tokens lex_sems t =
       | "NSYN",Val "pronoun" -> c(*{c with c_quant=Tuple[c.c_quant;Val "indexical"]}*),measure,cx_flag
       | "NSEM",Val "count" -> c(*{c with c_quant=Tuple[c.c_quant;Val "count"]}*),measure,cx_flag
       | "NSEM",Val "mass" -> {c with c_quant=Tuple[c.c_quant;Val "mass"]},measure,cx_flag
+      | "NSEM",Variant(e,[a,Val "mass";b,Val "count"]) -> {c with c_quant=Tuple[c.c_quant;Variant(e,[a,Val "mass";b,Val "count"])]},measure,cx_flag (* FIXME: tu by należało podzielić to na dwa pudełka *)
+      | "NSEM",Variant(e,[a,Val "count";b,Val "mass"]) -> {c with c_quant=Tuple[c.c_quant;Variant(e,[a,Val "count";b,Val "mass"])]},measure,cx_flag
       | "NSEM",Val "measure" -> c,true,cx_flag
       | "NSEM",Val "time" -> c,measure,cx_flag(*failwith "create_normal_concept: time"*)
       | "NUM",t -> {c with c_quant=Tuple[c.c_quant;t]},measure,cx_flag
@@ -110,7 +112,7 @@ let create_normal_concept (*roles role_attrs*) tokens lex_sems t =
       | "LEX",_ -> c,measure,cx_flag (* FIXME *) *)
 (*       | "TYPE",Val "int" -> {c with c_quant=Tuple[c.c_quant;Val "interrogative"]},measure *)
       (* | "TYPE",_ -> c,measure,cx_flag (* FIXME *) *)
-      | e,t -> failwith ("create_normal_concept noun: " ^ e)) in
+      | e,t -> failwith ("create_normal_concept noun: " ^ e ^ ": " ^ ENIAMsemStringOf.linear_term 0 t)) in
     (* let c = if t.pos = "depr" then {c with c_relations=Tuple[c.c_relations;SingleRelation(Val "depr")]} else c in *)
     if cx_flag then
       let id = ExtArray.add tokens ENIAMtokenizerTypes.empty_token_env in
@@ -65,6 +65,8 @@ let parse_role p = function
     "adjunct" -> {p with gf=ADJUNCT}
   | "unk" -> {p with role="unk"}
   | "nosem" -> {p with gf=NOSEM}
+  | "Poss" -> {p with role="Poss"; sel_prefs=[SynsetName "ALL"]}
+  | "Coref" -> {p with role="Coref"; sel_prefs=[SynsetName "ALL"]}
   | "Count" -> {p with role="Count"; sel_prefs=[SynsetName "ALL"]}
   | "Measure" -> {p with role="Measure"; sel_prefs=[SynsetName "ALL"]}
   | s -> failwith ("parse_role: " ^ s)
@@ -278,8 +278,8 @@ let rec assign_frames_rec tokens lex_sems tree arg_symbols visited = function
       let s = ExtArray.get lex_sems t.id in
       let symbol = get_phrase_symbol t.symbol in
       let frames = Xlist.fold s.ENIAMlexSemanticsTypes.frames [] (fun frames frame ->
-        print_endline ("selectors: " ^ ENIAMcategoriesPL.string_of_selectors frame.selectors);
-        Printf.printf "assign_frames_rec: lemma=%s positions=[%s]\n%!" t.lemma (ENIAMwalStringOf.schema frame.positions);
+        (* print_endline ("selectors: " ^ ENIAMcategoriesPL.string_of_selectors frame.selectors); *)
+        (* Printf.printf "assign_frames_rec: lemma=%s positions=[%s]\n%!" t.lemma (ENIAMwalStringOf.schema frame.positions); *)
         try
           let attrs = apply_selectors t.attrs frame.selectors in
           let frame = ENIAMsemLexicon.extend_frame symbol frame in
@@ -380,14 +380,21 @@ exception AGF
  
 let rec manage_agf = function (* Compares the "agf" attribute of each Node reached through Variant/Tuple with its "gf" attribute (Node args are not visited here); raises AGF when they disagree *)
   | Node t ->
+      (* print_endline ("manage_agf 1 " ^ ENIAM_LCGstringOf.linear_term 0 (Node t)); *)
       let attrs,agf = try extract_attr "agf" [] t.attrs with Not_found -> failwith "manage_agf" in (* a Node without "agf" is treated as a fatal error, not as an AGF mismatch *)
+      (* print_endline "manage_agf 2"; *)
       let gf = try get_attr "gf" t.attrs with Not_found -> Dot in (* FIXME: this should probably be fixed so that gf is always set *)
+      (* print_endline "manage_agf 3"; *)
       if agf = Val "" || agf=gf then Node{t with attrs=attrs} else raise AGF (* keep the node, with the attrs returned by extract_attr, only when agf is the empty value or equals gf *)
   | Variant(e,l) ->
+      (* print_endline ("manage_agf 4: " ^ ENIAM_LCGstringOf.linear_term 0 (Variant(e,l))); *)
       let l = Xlist.fold l [] (fun l (i,t) -> try (i, manage_agf t) :: l with AGF -> l) in (* alternatives that raise AGF are silently dropped; survivors are accumulated by consing *)
+      (* print_endline ("manage_agf 5: " ^ ENIAM_LCGstringOf.linear_term 0 (Variant(e,l))); *)
       if l = [] then raise AGF else Variant(e,List.rev l) (* no surviving alternative means the whole variant fails; List.rev undoes the consing order *)
   | Tuple l ->
+      (* print_endline "manage_agf 6"; *)
       let l = Xlist.rev_map l manage_agf in (* no handler here: an AGF raised by any element propagates to the caller *)
+      (* print_endline "manage_agf 7"; *)
       Tuple(List.rev l)
   | Dot -> Dot
   | t -> failwith ("cut_nodes: " ^ ENIAM_LCGstringOf.linear_term 0 t) (* NOTE(review): the message prefix says "cut_nodes" although this is manage_agf; looks copy-pasted, confirm and rename *)
@@ -408,7 +415,7 @@ let rec reduce_tree_rec tokens lex_sems result_tree mid_tree orig_tree = functio
   | Node t ->
       let args = reduce_tree_rec tokens lex_sems result_tree mid_tree orig_tree t.args in
       (* print_endline ("reduce_tree_rec 1: " ^ ENIAM_LCGstringOf.linear_term 0 args); *)
-      let args = try manage_agf args with AGF -> failwith "reduce_tree_rec: AGF" in
+      let args = try manage_agf args with AGF -> failwith "reduce_tree_rec: AGF" in (* FIXME: to nie musi być błąd, należałoby przechwytywać wyjątek na poziorie wariantu powyżej *)
       let args = cut_nodes result_tree args in
       (* print_endline ("reduce_tree_rec 2: " ^ ENIAM_LCGstringOf.linear_term 0 args); *)
       (*let id =
  
 day-lex:      /(date+day+day-month):unk;
 date:         /(1+year-lex):unk;
-day:          /month-lex:unk;
-day-interval: /month-lex:unk;
-day-month:    /(1+year-lex):unk;
+day:          /month-lex:Poss;
+day-interval: /month-lex:Poss;
+day-month:    /(1+year-lex):Poss;
 year-lex:     |(1+adjp*number*case*gender):unk;
-month-lex:    /(1+year+np*T*gen*T*T):unk;
+month-lex:    /(1+year+np*T*gen*T*T):Poss;
  
 date-interval:        null;
 day-month-interval:   null;
@@ -26,8 +26,8 @@ email:                null;
 np:
   \(1+num*number*case*gender*person*congr*nsem+num*number*case*gender*person*rec*nsem):adjunct \(1+qub):adjunct /(1+inclusion):adjunct
   \(1+measure*unumber*ucase*ugender*uperson):Measure
-  /(1+date+day+day-month+date-interval+day-interval+day-month-interval+year+year-interval+hour+hour-minute+hour-interval+hour-minute-interval):unk
-  |(1+year):unk /(1+obj-id):unk;
+  /(1+date+day+day-month+date-interval+day-interval+day-month-interval+year+year-interval+hour+hour-minute+hour-interval+hour-minute-interval+roman+roman-interval):Coref
+  |(1+year):unk /(1+obj-id):Coref;
  
 num: \(1+qub):adjunct /(1+inclusion):adjunct;
  
@@ -200,3 +200,4 @@ Ala zjadła kota.
 Kot wyszedł spod komody.
 Aranżuję na kilka fortepianów.
 Aranżuję na wiele fortepianów.
+Wiele wody płynie.
 converter
 results/*.tab
+analyze
@@ -167,223 +167,3 @@ let _ =
     print_meanings "resources/meanings.tab" meanings;
     print_adv_types "resources/adv_modes.tab" adv_types;
     ())
-
-(* Test wczytywania Walentego TEI *)
-(* let _ =
-   let walenty,phrases = ENIAMwalTEI.load_walenty "/home/yacheu/Dokumenty/NLP resources/Walenty/walenty_20170311.xml" in
-   let n = Xlist.fold ENIAMwalTEI.walenty 0 (fun n e -> let l = connect e in n + Xlist.size l) in
-   let m = Xlist.fold ENIAMwalTEI.walenty 0 (fun n e -> let l = schemata e in n + Xlist.size l) in
-   Printf.printf "%d connected\n%d schemata\n|phrases|=%d\n" n m (IntMap.size phrases);
-   () *)
-
-(* Test unikalności indeksów sensów *)
-(* let _ =
-  let walenty,phrases = ENIAMwalTEI.load_walenty "/home/yacheu/Dokumenty/NLP resources/Walenty/walenty_20170311.xml" in
-  Xlist.fold walenty IntMap.empty (fun map e ->
-    Xlist.fold e.meanings map (fun map m ->
-      IntMap.add_inc map m.mng_id m (fun m1 -> if m1 = m then m else failwith "meaning"))) *)
-
-(*
-(* let insert_phrases phrases = function
-    Frame(atrs,s) -> Frame(atrs,Xlist.map s (fun p ->
-      {p with morfs=Xlist.map p.morfs (function
-             MorfId id -> (try IntMap.find phrases id with Not_found -> failwith "insert_phrases")
-           | _ -> failwith "insert_phrases")}))
-  | _ -> failwith "insert_phrases: ni"
-
-let print_entry pos_map pos orth =
-  let orth_map = try StringMap.find pos_map pos with Not_found -> StringMap.empty in
-  let frames = try StringMap.find orth_map orth with Not_found -> [] in
-  Xlist.iter frames (fun frame ->
-      let frame = insert_phrases ENIAMwalTEI.phrases frame in
-      print_endline (ENIAMwalStringOf.frame orth frame)) *)
-
-(* Wypisanie hasła *)
-(* let _ =
-   print_entry connected_walenty "verb" "brudzić";
-   () *)
-
-(* let has_nontrivial_lex = function
-    Frame(atrs,s) -> Xlist.fold s false (fun b p ->
-      if p.role = "Lemma" && p.role_attr = "" then b else
-        Xlist.fold p.morfs b (fun b -> function
-              MorfId id -> failwith "has_nontrivial_lex"
-            | LexPhrase _ -> true
-            (* | LexRPhrase _ -> true
-               | LexPhraseMode _ -> true *)
-            | _ -> b))
-  | _ -> failwith "has_nontrivial_lex: ni" *)
-
-(* Leksykalizacje nie wchodzące do lematu *)
-(* let _ =
-   StringMap.iter connected_walenty (fun _ orth_map ->
-      StringMap.iter orth_map (fun orth frames ->
-          Xlist.iter frames (fun frame ->
-              let frame = insert_phrases ENIAMwalTEI.phrases frame in
-              if has_nontrivial_lex frame then
-                print_endline (ENIAMwalStringOf.frame orth frame)))) *)
-
-let simplify_frame_verb = function
-    Phrase(NP(Case "dat")) -> []
-  | Phrase(NP(Case "inst")) -> []
-  | Phrase(PrepNP _) -> []
-  | Phrase(ComprepNP _) -> []
-  | Phrase(AdvP) -> []
-  | t -> [t]
-
-let simplify_frame_noun = function
-    Phrase(NP(Case "gen")) -> []
-  | Phrase(NP(Case "nom")) -> []
-  | Phrase(NP(CaseAgr)) -> []
-  | Phrase(PrepNP _) -> []
-  | Phrase(ComprepNP _) -> []
-  | Phrase(AdjP CaseAgr) -> []
-  | PhraseComp(Ncp(Case "gen"),_)
-  | PhraseComp(Prepncp(_,_),_) -> []
-  | PhraseAbbr(Possp,[]) -> []
-  | t -> [t]
-
-let simplify_frame_adj = function
-  | t -> [t]
-
-let simplify_frame_adv = function
-  | t -> [t]
-
-
-(* let simplify_frame pos = function
-    Frame(atrs,s) ->
-    let schema = Xlist.fold s [] (fun schema p ->
-        let morfs = Xlist.fold p.morfs [] (fun morfs morf ->
-            match pos with
-              "verb" -> simplify_frame_verb morf @ morfs
-            | "noun" -> simplify_frame_noun morf @ morfs
-            | "adj" -> simplify_frame_adj morf @ morfs
-            | "adv" -> simplify_frame_adv morf @ morfs
-            | _ -> failwith "simplify_frame") in
-        if morfs = [] then schema else
-          {p with ce=[]; cr=[]; morfs=morfs} :: schema) in
-    if schema = [] then [] else [Frame(atrs,schema)]
-  | _ -> failwith "simplify_frame: ni" *)
-
-
-(* Uproszczone schematy *)
-(* let _ =
-   StringMap.iter schemata_walenty (fun pos orth_map ->
-      if pos = "noun" then
-      StringMap.iter orth_map (fun orth frames ->
-          Xlist.iter frames (fun frame ->
-              let frame = insert_phrases ENIAMwalTEI.phrases frame in
-              let frames = simplify_frame pos frame in
-              Xlist.iter frames (fun frame -> print_endline (ENIAMwalStringOf.frame orth frame))))) *)
-
-(* let has_mode_coordination = function
-    Frame(atrs,s) -> Xlist.fold s false (fun b p ->
-      let n = Xlist.fold p.morfs 0 (fun n -> function
-            MorfId id -> failwith "has_nontrivial_lex"
-          | PhraseAbbr(Advp _,_) -> n+1
-          | PhraseAbbr(Xp _,_) -> n+1
-          (* | LexPhraseMode _ -> n+1 FIXME*)
-          | _ -> n) in
-      if n>1 then true else b)
-  | _ -> failwith "has_nontrivial_lex: ni" *)
-
-(* Koordynacja z mode *)
-(* let _ =
-   StringMap.iter schemata_walenty(*connected_walenty*) (fun _ orth_map ->
-      StringMap.iter orth_map (fun orth frames ->
-          Xlist.iter frames (fun frame ->
-              let frame = insert_phrases ENIAMwalTEI.phrases frame in
-              if has_mode_coordination frame then
-                print_endline (ENIAMwalStringOf.frame orth frame)))) *)
-
-
-(* let get_entry orth pos *)
-     (*
-let load_walenty2 () =
-  let walenty = load_walenty walenty_filename in
-  Xlist.fold walenty StringMap.empty (fun walenty entry ->
-    if entry.frames = [] then Xlist.fold (connect2 entry) walenty (fun walenty (lemma,pos,frame) ->
-      let map = try StringMap.find walenty pos with Not_found -> StringMap.empty in
-      let map = StringMap.add_inc map lemma [frame] (fun l -> frame :: l) in
-      StringMap.add walenty pos map)
-    else Xlist.fold (connect entry) walenty (fun walenty (lemma,pos,frame) ->
-      let map = try StringMap.find walenty pos with Not_found -> StringMap.empty in
-      let map = StringMap.add_inc map lemma [frame] (fun l -> frame :: l) in
-      StringMap.add walenty pos map))
-
-
-let print_stringqmap filename qmap =
-  let l = StringQMap.fold qmap [] (fun l k v -> (v,k) :: l) in
-  File.file_out filename (fun file ->
-    Xlist.iter (Xlist.sort l compare) (fun (v,k) ->
-      Printf.fprintf file "%5d %s\n" v k))
-
-let sel_prefs_quantities walenty =
-  Xlist.fold walenty StringQMap.empty (fun quant e ->
-    Xlist.fold e.frames quant (fun quant f ->
-      Xlist.fold f.arguments quant (fun quant a ->
-        Xlist.fold a.sel_prefs quant (fun quant l ->
-          Xlist.fold l quant (fun quant -> function
-              Numeric s ->
-                let name = try ENIAMplWordnet.synset_name s with Not_found -> "unknown" in
-                StringQMap.add quant ("N " ^ s ^ " " ^ name)
-            | Symbol s -> StringQMap.add quant ("S " ^ s)
-            | Relation(s,t) -> StringQMap.add quant ("R " ^ s ^ " | " ^ t))))))
-*)
-(*let _ =
-  let walenty = load_walenty walenty_filename in
-  let quant = sel_prefs_quantities walenty in
-  print_stringqmap "results/quant_sel_prefs.txt" quant*)
-
-(*let _ =
-  let walenty = load_walenty2 () in
-  let frames_sem = try StringMap.find (StringMap.find walenty "verb") "bębnić" with Not_found -> failwith "walTEI" in
-  Xlist.iter frames_sem (fun frame ->
-    print_endline (WalStringOf.frame "bębnić" frame))*)
-
-
-(* Wypisanie realizacji *)
-(* let _ =
-   Xlist.iter ENIAMwalTEI.expands (fun (id,morf,l) ->
-      Printf.printf "%d %s:\n" id (ENIAMwalStringOf.morf morf);
-      Xlist.iter l (fun morf -> Printf.printf "    %s\n" (ENIAMwalStringOf.morf morf))) *)
-
-(* Wypisanie realizacji po przetworzeniu *)
-(* let _ =
-   AbbrMap.iter expands (fun morf l ->
-      Printf.printf "%s:\n" (ENIAMwalStringOf.phrase_abbr morf);
-      Xlist.iter l (fun morf -> Printf.printf "    %s\n" (ENIAMwalStringOf.morf morf))) *)
-
-let has_realization = function
-    PhraseAbbr _ -> true
-  | PhraseComp _ -> true
-  | _ -> false
-
-(* Wypisanie fraz, które podlegają rozwijaniu *)
-(*let _ =
-  IntMap.iter ENIAMwalTEI.phrases (fun i morf ->
-      if has_realization morf then
-      Printf.printf "%4d %s\n" i (ENIAMwalStringOf.morf morf)) *)
-
-(* Wypisanie fraz, które podlegają rozwijaniu *)
-(* let _ =
-   IntMap.iter phrases (fun i morf ->
-      if has_realization morf then
-      Printf.printf "%4d %s\n" i (ENIAMwalStringOf.morf morf)) *)
-
-(* let test_phrases = [17088; 17133; 1642]
-   let _ =
-   Xlist.iter test_phrases (fun i ->
-      let m1 = IntMap.find ENIAMwalTEI.phrases i in
-      let m2 = IntMap.find phrases i in
-      Printf.printf "%4d %s\n" i (ENIAMwalStringOf.morf m1);
-      Printf.printf "%4d %s\n" i (ENIAMwalStringOf.morf m2)) *)
-
-(* let print_entries entries =
-  StringMap.iter entries (fun pos entries2 ->
-      StringMap.iter entries2 (fun lemma entries3 ->
-          EntrySet.iter entries3 (fun entry ->
-              Printf.printf "%s: %s: %s\n" pos lemma (ENIAMwalStringOf.entry entry)))) *)
-
-(* let _ = print_entries entries *)
-*)
@@ -86,9 +86,9 @@ let parse_gf = function
  
 let parse_control arg = function (* Records a control marker on arg: controller tags are prepended to arg.cr, controllee tags to arg.ce; any other string fails *)
     "controller" -> {arg with cr="1" :: arg.cr}
-  | "controllee" -> {arg with ce="1" :: arg.cr}
+  | "controllee" -> {arg with ce="1" :: arg.ce} (* the removed line built ce from the tail of arg.cr; the new line extends arg.ce itself *)
   | "controller2" -> {arg with cr="2" :: arg.cr}
-  | "controllee2" -> {arg with ce="2" :: arg.cr}
+  | "controllee2" -> {arg with ce="2" :: arg.ce} (* same correction for the second control index *)
   | s -> failwith ("parse_control: " ^ s)
  
 let parse_case = function
@@ -6,11 +6,15 @@ OCAMLFLAGS=$(INCLUDES) -g
 OCAMLOPTFLAGS=$(INCLUDES) unix.cmxa xml-light.cmxa str.cmxa nums.cmxa zip.cmxa bz2.cmxa xlib.cmxa
 INSTALLDIR=`ocamlc -where`/eniam
  
-SOURCES=entries.ml ENIAMwalTypes.ml ENIAMwalStringOf.ml ENIAMwalTEI.ml ENIAMwalConnect.ml ENIAMwalRealizations.ml ENIAMwalLex.ml ENIAMwalGenerate.ml
+SOURCES=entries.ml ENIAMwalTypes.ml ENIAMwalStringOf.ml ENIAMwalTEI.ml ENIAMwalConnect.ml ENIAMwalRealizations.ml ENIAMwalLex.ml
  
-all: $(SOURCES)
+all: $(SOURCES) ENIAMwalGenerate.ml
 	$(OCAMLOPT) -o converter $(OCAMLOPTFLAGS) $^
  
+analyze: $(SOURCES) ENIAMwalAnalyze.ml # links the shared SOURCES with ENIAMwalAnalyze.ml into the analyze binary, after ensuring results/ exists; NOTE(review): ENIAMwalAnalyze.ml is not in this commit's changed-file list, confirm it is present in the tree
+	mkdir -p results
+	$(OCAMLOPT) -o analyze $(OCAMLOPTFLAGS) $^
+
 install:
 	mkdir -p /usr/share/eniam/Walenty
 	cp resources/*  /usr/share/eniam/Walenty
@@ -40,4 +44,4 @@ install-local:
 	$(OCAMLOPT) $(OCAMLOPTFLAGS) -c $<
  
 clean:
-	rm -f *~ *.cm[aoix] *.o *.so *.cmxa *.a converter resources/*.tab
+	rm -f *~ *.cm[aoix] *.o *.so *.cmxa *.a converter analyze resources/*.tab results/*