Commit 2043a7b2d845c55f325cfefd2f0924d51188e9b9
1 parent 3eabc2ee
bardziej zmodyfikowany import SGJP
Showing 3 changed files with 262 additions and 209 deletions
dictionary/management/commands/import_data.py
... | ... | @@ -4,7 +4,6 @@ import sqlite3 |
4 | 4 | import datetime |
5 | 5 | from django.db import connection, transaction |
6 | 6 | from django.core.management.base import BaseCommand |
7 | -from django.contrib.auth.models import User | |
8 | 7 | |
9 | 8 | from common.util import no_history |
10 | 9 | from dictionary.models import * |
... | ... | @@ -12,12 +11,13 @@ from dictionary.models import * |
12 | 11 | DEFAULT_DATABASE = 'data/sgjp.db' |
13 | 12 | |
14 | 13 | MINI_MODE = True # do debugowania |
15 | -MINI_LEXEME_COUNT = 500 | |
14 | +MINI_LEXEME_COUNT = 40000 | |
16 | 15 | MINI_LEXEME_QUERY = 'SELECT %s FROM leksemy LIMIT ?' |
17 | 16 | |
18 | -# UWAGA: aktualnie ustawienie SQL_MODE = False jest niekompletne | |
19 | 17 | SQL_MODE = True |
20 | 18 | |
19 | +BATCH_SIZE = 5000 | |
20 | + | |
21 | 21 | OTHER = 'inne' |
22 | 22 | DEFAULT_VOCAB = 'SGJP' |
23 | 23 | |
... | ... | @@ -60,6 +60,9 @@ def get_cursor(db): |
60 | 60 | conn.row_factory = sqlite3.Row |
61 | 61 | return conn.cursor() |
62 | 62 | |
63 | +def bulk_create(model, objects): | |
64 | + model.objects.bulk_create(objects, batch_size=BATCH_SIZE) | |
65 | + | |
63 | 66 | METHOD_NAMES = { |
64 | 67 | CrossReference: 'import_cross_references', |
65 | 68 | Ending: 'import_endings', |
... | ... | @@ -81,6 +84,9 @@ METHOD_NAMES = { |
81 | 84 | |
82 | 85 | class ImportData(object): |
83 | 86 | def __init__(self, db): |
87 | + transaction.commit_unless_managed() | |
88 | + transaction.enter_transaction_management() | |
89 | + transaction.managed() | |
84 | 90 | self.cursor = connection.cursor() |
85 | 91 | self.sqlite_cursor = get_cursor(db) |
86 | 92 | no_history() |
... | ... | @@ -88,12 +94,19 @@ class ImportData(object): |
88 | 94 | def close(self): |
89 | 95 | self.cursor.close() |
90 | 96 | self.sqlite_cursor.close() |
97 | + transaction.commit() | |
98 | + transaction.leave_transaction_management() | |
99 | + | |
91 | 100 | |
92 | 101 | def new_lexical_classes(self): |
93 | 102 | yield LexicalClass(symbol=OTHER) |
94 | 103 | for row in self.sqlite_cursor.execute('select distinct pos from wzory'): |
95 | 104 | yield LexicalClass(symbol=row['pos']) |
96 | 105 | |
106 | + def cache_lc(self): | |
107 | + if 'lc' not in self.__dict__: | |
108 | + self.lc = dict((lc.symbol, lc) for lc in LexicalClass.objects.all()) | |
109 | + | |
97 | 110 | def new_parts_of_speech(self): |
98 | 111 | lcs = {} |
99 | 112 | for row in self.sqlite_cursor.execute( |
... | ... | @@ -106,6 +119,16 @@ class ImportData(object): |
106 | 119 | yield PartOfSpeech( |
107 | 120 | symbol=row['pos'], lexical_class = LexicalClass.objects.get(symbol=lc)) |
108 | 121 | |
122 | + def cache_pos(self): | |
123 | + if 'pos' not in self.__dict__: | |
124 | + self.pos = dict((pos.symbol, pos) for pos in PartOfSpeech.objects.all()) | |
125 | + | |
126 | + def cache_lc_pos(self): | |
127 | + if 'lc_pos' not in self.__dict__: | |
128 | + self.lc_pos = dict( | |
129 | + (pos.symbol, pos.lexical_class) for pos in PartOfSpeech.objects.all() | |
130 | + ) | |
131 | + | |
109 | 132 | def new_base_form_labels(self): |
110 | 133 | query_result = self.sqlite_cursor.execute(""" |
111 | 134 | SELECT efobaz FROM paradygmaty |
... | ... | @@ -115,6 +138,10 @@ class ImportData(object): |
115 | 138 | for row in query_result: |
116 | 139 | yield BaseFormLabel(entry=row[0]) |
117 | 140 | |
141 | + def cache_bfl(self): | |
142 | + if 'bfls' not in self.__dict__: | |
143 | + self.bfls = dict((bfl.entry, bfl) for bfl in BaseFormLabel.objects.all()) | |
144 | + | |
118 | 145 | def new_inflection_characteristics(self): |
119 | 146 | for row in self.sqlite_cursor.execute( |
120 | 147 | 'SELECT DISTINCT charfl, pos FROM paradygmaty'): |
... | ... | @@ -130,9 +157,11 @@ class ImportData(object): |
130 | 157 | part_of_speech=PartOfSpeech.objects.get(pk=row['pos'])) |
131 | 158 | |
132 | 159 | def cache_ics(self): |
133 | - self.ics = {} | |
134 | - for ic in InflectionCharacteristic.objects.all(): | |
135 | - self.ics[(ic.basic_form_label.entry, ic.part_of_speech.symbol)] = ic | |
160 | + if 'ics' not in self.__dict__: | |
161 | + self.ics = dict( | |
162 | + ((ic.entry, ic.part_of_speech.symbol), ic) | |
163 | + for ic in InflectionCharacteristic.objects.all() | |
164 | + ) | |
136 | 165 | |
137 | 166 | def new_vocabularies(self): |
138 | 167 | result = self.sqlite_cursor.execute(""" |
... | ... | @@ -143,6 +172,10 @@ class ImportData(object): |
143 | 172 | for row in result: |
144 | 173 | yield Vocabulary(id = row[0]) |
145 | 174 | |
175 | + def cache_vocabs(self): | |
176 | + if 'vocabs' not in self.__dict__: | |
177 | + self.vocabs = dict((v.id, v) for v in Vocabulary.objects.all()) | |
178 | + | |
146 | 179 | def new_qualifiers(self): |
147 | 180 | sgjp = Vocabulary.objects.get(id=DEFAULT_VOCAB) |
148 | 181 | query_result = self.sqlite_cursor.execute(""" |
... | ... | @@ -160,51 +193,61 @@ class ImportData(object): |
160 | 193 | added.add(qualifier_label) |
161 | 194 | yield Qualifier(label=qualifier_label, vocabulary=sgjp) |
162 | 195 | |
163 | - def import_lexemes(self): | |
196 | + def cache_qualifiers(self): | |
197 | + if 'qual' not in self.__dict__: | |
198 | + self.qual = dict((q.label, q) for q in Qualifier.objects.all()) | |
199 | + | |
200 | + def new_lexemes(self): | |
201 | + self.cache_qualifiers() | |
164 | 202 | if MINI_MODE: |
165 | 203 | result = self.sqlite_cursor.execute( |
166 | 204 | MINI_LEXEME_QUERY % '*',(MINI_LEXEME_COUNT,)) |
167 | 205 | else: |
168 | 206 | result = self.sqlite_cursor.execute('SELECT * FROM leksemy') |
169 | 207 | date = datetime.datetime.now() |
170 | - cv_table = dict(ClassificationValue.objects.values_list('label', 'pk')) | |
208 | + cv_table = dict( | |
209 | + (cv.label, cv) for cv in ClassificationValue.objects.all()) | |
210 | + lexemes = [] | |
211 | + lexeme_associations = [] | |
212 | + lexeme_qualifiers = [] | |
213 | + lexeme_cvs = [] | |
171 | 214 | for row in result: |
172 | 215 | slownik = row['slownik'] |
173 | 216 | status = 'conf' if slownik != 'zmiotki' else 'cand' |
174 | - cv_pk = cv_table[row['pospolitosc']] | |
175 | - self.cursor.execute( | |
176 | - "INSERT INTO leksemy (id, haslo, haslosuf, glosa, nota, wymowa, hom, " | |
177 | - "pos, zrodlo, status, komentarz, data_modyfikacji, slownik, usuniety) " | |
178 | - "VALUES (%s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s)", | |
179 | - [row['nr'], row['haslo'], row['haslosuf'] or '', row['glosa'] or '', | |
180 | - row['nota'] or '', row['wymowa'] or '', 1, row['pos'], 'SGJP', | |
181 | - status, row['komentarz'], date, row['slownik'], False]) | |
182 | - self.cursor.execute( | |
183 | - "INSERT INTO leksemy_w_slownikach (l_id, slownik) " | |
184 | - "VALUES (%s, %s)", [row['nr'], slownik]) | |
185 | - self.cursor.execute( | |
186 | - "INSERT INTO wartosci_klasyfikacji_lexemes (classificationvalue_id, " | |
187 | - "lexeme_id) VALUES (%s, %s)", [cv_pk, row['nr']]) | |
217 | + cv = cv_table[row['pospolitosc']] | |
218 | + lexemes.append(Lexeme( | |
219 | + id=row['nr'], | |
220 | + entry=row['haslo'], | |
221 | + entry_suffix=row['haslosuf'] or '', | |
222 | + gloss=row['glosa'] or '', | |
223 | + note=row['nota'] or '', | |
224 | + pronunciation=row['wymowa'] or '', | |
225 | + part_of_speech_id=row['pos'], | |
226 | + source='SGJP', | |
227 | + status=status, | |
228 | + comment=row['komentarz'] or '', | |
229 | + last_modified=date, | |
230 | + owner_vocabulary_id=slownik, | |
231 | + )) | |
232 | + lexeme_associations.append(LexemeAssociation( | |
233 | + lexeme_id=row['nr'], vocabulary_id=slownik)) | |
234 | + lexeme_cvs.append((row['nr'], cv)) | |
188 | 235 | if row['lkwal']: |
189 | 236 | for qual in row['lkwal'].split('|'): |
190 | - q_id = Qualifier.objects.get(label=qual).pk | |
191 | - self.cursor.execute( | |
192 | - "INSERT INTO kwalifikatory_leksemow (lexeme_id, " | |
193 | - "qualifier_id) VALUES (%s, %s)", [row['nr'], q_id]) | |
237 | + lexeme_qualifiers.append((row['nr'], self.qual[qual])) | |
238 | + return lexemes, lexeme_associations, lexeme_cvs, lexeme_qualifiers | |
194 | 239 | |
195 | 240 | def new_lexeme_associations(self): |
241 | + self.cache_vocabs() | |
196 | 242 | if MINI_MODE: |
197 | 243 | result = self.sqlite_cursor.execute( |
198 | 244 | 'SELECT * FROM slowniki_uzywajace WHERE nr in (%s)' |
199 | 245 | % (MINI_LEXEME_QUERY % 'nr'), [MINI_LEXEME_COUNT]) |
200 | 246 | else: |
201 | 247 | result = self.sqlite_cursor.execute('SELECT * FROM slowniki_uzywajace') |
202 | - vocab_table = dict( | |
203 | - (v.id, v) for v in Vocabulary.objects.all() | |
204 | - ) | |
205 | 248 | for row in result: |
206 | 249 | yield LexemeAssociation( |
207 | - vocabulary=vocab_table[row['slownik_uz']], lexeme_id=row['nr']) | |
250 | + vocabulary=self.vocabs[row['slownik_uz']], lexeme_id=row['nr']) | |
208 | 251 | |
209 | 252 | def new_cross_reference_types(self): |
210 | 253 | result = self.sqlite_cursor.execute( |
... | ... | @@ -221,7 +264,7 @@ class ImportData(object): |
221 | 264 | to_pos=PartOfSpeech.objects.get(symbol=row['pos2']), |
222 | 265 | ) |
223 | 266 | |
224 | - def import_cross_references(self): | |
267 | + def new_cross_references(self): | |
225 | 268 | if MINI_MODE: |
226 | 269 | result = self.sqlite_cursor.execute( |
227 | 270 | 'SELECT o.*, l1.pos pos1, l2.pos pos2 FROM odsylacze o ' |
... | ... | @@ -249,129 +292,126 @@ class ImportData(object): |
249 | 292 | type=cr_type) |
250 | 293 | |
251 | 294 | def import_pattern_types(self): |
295 | + self.cache_lc_pos() | |
252 | 296 | result = self.sqlite_cursor.execute( |
253 | 297 | 'SELECT DISTINCT typr, pos FROM paradygmaty') |
254 | - lc_pos_table = dict( | |
255 | - (pos.symbol, pos.lexical_class) for pos in PartOfSpeech.objects.all() | |
256 | - ) | |
257 | 298 | for row in result: |
258 | - lc = lc_pos_table[row['pos']] | |
299 | + lc = self.lc_pos[row['pos']] | |
259 | 300 | PatternType.objects.get_or_create(lexical_class=lc, entry=row['typr']) |
260 | 301 | # prowizorka z powodu pustej klasy 'skr' |
261 | - lc_table = dict( | |
262 | - (lc.symbol, lc) for lc in LexicalClass.objects.all() | |
263 | - ) | |
302 | + self.cache_lc() | |
264 | 303 | result = self.sqlite_cursor.execute('SELECT DISTINCT typr, pos FROM wzory') |
265 | 304 | for row in result: |
266 | - lc = lc_table[row['pos']] | |
305 | + lc = self.lc[row['pos']] | |
267 | 306 | PatternType.objects.get_or_create(lexical_class=lc, entry=row['typr']) |
268 | 307 | |
308 | + def cache_ptypes(self): | |
309 | + if 'ptypes' not in self.__dict__: | |
310 | + self.ptypes = dict( | |
311 | + ((pt.lexical_class.symbol, pt.entry), pt) | |
312 | + for pt in PatternType.objects.all() | |
313 | + ) | |
314 | + | |
269 | 315 | def new_patterns(self): |
270 | - pt_table = dict( | |
271 | - ((pt.lexical_class.symbol, pt.entry), pt) | |
272 | - for pt in PatternType.objects.all() | |
273 | - ) | |
316 | + self.cache_ptypes() | |
274 | 317 | for row in self.sqlite_cursor.execute('SELECT * FROM wzory'): |
275 | - pt = pt_table[(row['pos'], row['typr'])] | |
276 | - status = 'temp' | |
277 | 318 | yield Pattern( |
278 | 319 | name=row['wzor'], |
279 | - type=pt, | |
320 | + type=self.ptypes[(row['pos'], row['typr'])], | |
280 | 321 | basic_form_ending=row['zakp'], |
281 | 322 | example=row['przyklad'] or '', |
282 | 323 | comment=row['wkomentarz'] or '', |
283 | - status = status, | |
324 | + status = 'temp', | |
284 | 325 | ) |
285 | 326 | |
286 | - def import_endings(self): | |
287 | - if SQL_MODE: | |
288 | - pattern_pk_table = dict(Pattern.objects.values_list('name', 'pk')) | |
289 | - bfl_table = dict(BaseFormLabel.objects.values_list('entry', 'pk')) | |
327 | + def cache_patterns(self): | |
328 | +  if 'patterns' not in self.__dict__: | |
329 | + self.patterns = dict((p.name, p) for p in Pattern.objects.all()) | |
330 | + | |
331 | + def new_endings(self): | |
332 | + self.cache_qualifiers() | |
333 | + self.cache_patterns() | |
334 | + self.cache_bfl() | |
335 | + endings = [] | |
336 | + ending_quals = [] | |
290 | 337 | for row in self.sqlite_cursor.execute('SELECT * FROM zakonczenia'): |
291 | 338 | if row['zak'] is not None: |
292 | - if not SQL_MODE: | |
293 | - e = Ending( | |
294 | - pattern=Pattern.objects.get(name=row['wzor']), | |
295 | - base_form_label = BaseFormLabel.objects.get(entry=row['efobaz']), | |
296 | - string = row['zak'], | |
297 | - index = row['nrskl'], | |
298 | - ) | |
299 | - e.save() | |
339 | + endings.append(Ending( | |
340 | + pattern=self.patterns[row['wzor']], | |
341 | + base_form_label = self.bfls[row['efobaz']], | |
342 | + string = row['zak'], | |
343 | + index = row['nrskl'], | |
344 | + )) | |
345 | + if row['zkwal']: | |
300 | 346 | for qual in row['zkwal'].split('|'): |
301 | - e.qualifiers.add(Qualifier.objects.get(label=qual)) #add | |
302 | - else: | |
303 | - pattern_pk = pattern_pk_table[row['wzor']] | |
304 | - if pattern_pk: | |
305 | - efobaz_id = bfl_table[row['efobaz']] | |
306 | - self.cursor.execute( | |
307 | - "INSERT INTO zakonczenia (w_id, efobaz, zind, zak) VALUES " | |
308 | - "(%s, %s, %s, %s)", | |
309 | - [pattern_pk, efobaz_id, row['nrskl'], row['zak']]) | |
310 | - if row['zkwal']: | |
311 | - self.cursor.execute("select currval('zakonczenia_id_seq')") | |
312 | - last_id = self.cursor.fetchone()[0] | |
313 | - for qual in row['zkwal'].split('|'): | |
314 | - q_id = Qualifier.objects.get(label=qual).pk | |
315 | - self.cursor.execute( | |
316 | - "INSERT INTO kwalifikatory_zakonczen (ending_id, qualifier_id) " | |
317 | - "VALUES (%s, %s)", [last_id, q_id]) | |
318 | - | |
319 | - def import_lexeme_inflection_patterns(self): | |
347 | + ending_quals.append(( | |
348 | + self.patterns[row['wzor']], | |
349 | + self.bfls[row['efobaz']], | |
350 | + row['nrskl'], | |
351 | + self.qual[qual])) | |
352 | + return endings, ending_quals | |
353 | + | |
354 | + def new_lexeme_inflection_patterns(self): | |
355 | + self.cache_ics() | |
356 | + self.cache_qualifiers() | |
357 | + self.cache_patterns() | |
320 | 358 | if MINI_MODE: |
321 | 359 | result = self.sqlite_cursor.execute( |
322 | - 'SELECT * FROM odmieniasie WHERE nr IN (%s)' % (MINI_LEXEME_QUERY % 'nr'), | |
360 | + 'SELECT o.*, l.pos FROM odmieniasie o ' | |
361 | + 'JOIN leksemy l on o.nr = l.nr ' | |
362 | + 'WHERE l.nr IN (%s)' % (MINI_LEXEME_QUERY % 'nr'), | |
323 | 363 | (MINI_LEXEME_COUNT,)) |
324 | 364 | else: |
325 | 365 | result = self.sqlite_cursor.execute('SELECT * FROM odmieniasie') |
326 | - pos_table = dict(Lexeme.objects.values_list('pk', 'part_of_speech')) | |
327 | - pattern_pk_table = dict(Pattern.objects.values_list('name', 'pk')) | |
366 | + lips = [] | |
367 | + lip_quals = [] | |
328 | 368 | for row in result: |
329 | - if not SQL_MODE: | |
330 | - lip = LexemeInflectionPattern( | |
331 | - lexeme_id=row['nr'], | |
332 | - index=row['oskl'], | |
333 | - pattern=Pattern.objects.get(name=row['wzor']), | |
334 | - inflection_characteristic=self.ics[ | |
335 | - (row['charfl'], lip.lexeme.part_of_speech)], | |
336 | - root=row['rdzen'], | |
337 | - ) | |
338 | - lip.save() | |
339 | - # nieaktualne | |
340 | - if row['okwal']: | |
341 | - lip.qualifiers.add(Qualifier.objects.get(label=row['okwal'])) #add | |
342 | - else: | |
343 | - pos = pos_table[row['nr']] | |
344 | - pattern_pk = pattern_pk_table[row['wzor']] | |
345 | - charfl_id = self.ics[(row['charfl'], pos)].pk | |
346 | - self.cursor.execute( | |
347 | - "INSERT INTO odmieniasie (l_id, oind, w_id, charfl, rdzen) " | |
348 | - "VALUES (%s, %s, %s, %s, %s) ", [row['nr'], row['oskl'], pattern_pk, | |
349 | - charfl_id, row['rdzen']]) | |
350 | - if row['okwal']: | |
351 | - self.cursor.execute("select currval('odmieniasie_id_seq')") | |
352 | - last_id = self.cursor.fetchone()[0] | |
353 | - for qual in row['okwal'].split('|'): | |
354 | - q_id = Qualifier.objects.get(label=qual).pk | |
355 | - self.cursor.execute( | |
356 | - "INSERT INTO kwalifikatory_odmieniasiow (lexemeinflectionpattern_id, " | |
357 | - "qualifier_id) VALUES (%s, %s)", [last_id, q_id]) | |
369 | + lexeme_id = row['nr'] | |
370 | + lips.append(LexemeInflectionPattern( | |
371 | + lexeme_id=lexeme_id, | |
372 | + index=row['oskl'], | |
373 | + pattern=self.patterns[row['wzor']], | |
374 | + inflection_characteristic=self.ics[ | |
375 | + (row['charfl'], row['pos'])], | |
376 | + root=row['rdzen'], | |
377 | + )) | |
378 | + if row['okwal']: | |
379 | + for qual in row['okwal'].split('|'): | |
380 | + lip_quals.append((lexeme_id, row['oskl'], self.qual[qual])) #add | |
381 | + return lips, lip_quals | |
382 | + | |
383 | + def new_variants(self): | |
384 | + result = self.sqlite_cursor.execute( | |
385 | + 'SELECT DISTINCT wariant FROM paradygmaty') | |
386 | + for row in result: | |
387 | + yield Variant(id=row['wariant']) | |
388 | + | |
389 | + def new_table_templates(self): | |
390 | + self.cache_ics() | |
391 | + self.cache_ptypes() | |
392 | + self.cache_lc_pos() | |
393 | + result = self.sqlite_cursor.execute( | |
394 | + 'SELECT DISTINCT wariant, pos, typr, charfl FROM paradygmaty') | |
395 | + for row in result: | |
396 | + yield TableTemplate( | |
397 | + variant_id=row['wariant'], | |
398 | + pattern_type=self.ptypes[(self.lc_pos[row['pos']].symbol, row['typr'])], | |
399 | + inflection_characteristic=self.ics[(row['charfl'], row['pos'])]) | |
358 | 400 | |
401 | + # to zostaje, bo tabelki i tak się pozmieniają | |
359 | 402 | def import_tables(self): |
360 | - bfl_table = dict(BaseFormLabel.objects.values_list('entry', 'pk')) | |
361 | - lc_pos_table = dict( | |
362 | - (pos.symbol, pos.lexical_class) for pos in PartOfSpeech.objects.all() | |
403 | + self.cache_bfl() | |
404 | + tt_table = dict( | |
405 | + (( | |
406 | + tt.variant.id, | |
407 | + tt.pattern_type.entry, | |
408 | + tt.inflection_characteristic.entry, | |
409 | + tt.inflection_characteristic.part_of_speech.symbol, | |
410 | + ), tt) for tt in TableTemplate.objects.all() | |
363 | 411 | ) |
364 | 412 | for row in self.sqlite_cursor.execute('SELECT * FROM paradygmaty'): |
365 | - lc = lc_pos_table[row['pos']] | |
366 | - variant, _created = Variant.objects.get_or_create(id=row['wariant']) | |
367 | - tt_data = { | |
368 | - 'variant': variant, | |
369 | - 'pattern_type': PatternType.objects.get( | |
370 | - entry=row['typr'], lexical_class=lc), | |
371 | - 'inflection_characteristic': InflectionCharacteristic.objects.get( | |
372 | - entry=row['charfl'], part_of_speech_symbol=row['pos']), | |
373 | - } | |
374 | - tt, _created = TableTemplate.objects.get_or_create(**tt_data) | |
413 | + tt = tt_table[ | |
414 | + (unicode(row['wariant']), row['typr'], row['charfl'], row['pos'])] | |
375 | 415 | if not SQL_MODE: |
376 | 416 | c = Cell( |
377 | 417 | table_template=tt, |
... | ... | @@ -392,7 +432,7 @@ class ImportData(object): |
392 | 432 | ) |
393 | 433 | tc.save() |
394 | 434 | else: |
395 | - efobaz_id = bfl_table[row['efobaz']] | |
435 | + efobaz_id = self.bfls[row['efobaz']].id | |
396 | 436 | self.cursor.execute( |
397 | 437 | "INSERT INTO klatki (st_id, efobaz, tag, prefiks, sufiks, kind) " |
398 | 438 | "VALUES (%s, %s, %s, %s, %s, %s)", [tt.pk, efobaz_id, row['morf'], |
... | ... | @@ -421,19 +461,17 @@ class ImportData(object): |
421 | 461 | rowspan=row['rowspan'], |
422 | 462 | colspan=row['colspan'], |
423 | 463 | label=row['nagl'], |
424 | - horizontal=row['styl'] == 'h', | |
464 | + css_class=row['styl'], | |
425 | 465 | ) |
426 | 466 | else: |
427 | 467 | raise Exception('Brak szablonu dla nagłówka: %s', dict(row)) |
428 | 468 | |
429 | 469 | def delete_and_import(self): |
430 | - transaction.commit_unless_managed() | |
431 | - transaction.enter_transaction_management() | |
432 | - transaction.managed() | |
433 | 470 | models = ( |
434 | 471 | TableCell, |
435 | 472 | Cell, |
436 | 473 | TableTemplate, |
474 | + Variant, | |
437 | 475 | CrossReference, |
438 | 476 | CrossReferenceType, |
439 | 477 | LexemeAssociation, |
... | ... | @@ -454,63 +492,74 @@ class ImportData(object): |
454 | 492 | model.objects.all().delete() |
455 | 493 | |
456 | 494 | print 'importing lexical classes...' |
457 | - LexicalClass.objects.bulk_create(self.new_lexical_classes()) | |
458 | - print 'importing parts of speech' | |
459 | - PartOfSpeech.objects.bulk_create(self.new_parts_of_speech()) | |
460 | - print 'importing base form labels' | |
461 | - BaseFormLabel.objects.bulk_create(self.new_base_form_labels()) | |
462 | - print 'importing inflection characteristics' | |
463 | - InflectionCharacteristic.objects.bulk_create( | |
495 | + bulk_create(LexicalClass, self.new_lexical_classes()) | |
496 | + print 'importing parts of speech...' | |
497 | + bulk_create(PartOfSpeech, self.new_parts_of_speech()) | |
498 | + print 'importing base form labels...' | |
499 | + bulk_create(BaseFormLabel, self.new_base_form_labels()) | |
500 | + print 'importing inflection characteristics...' | |
501 | + bulk_create(InflectionCharacteristic, | |
464 | 502 | self.new_inflection_characteristics()) |
465 | 503 | print 'importing vocabularies...' |
466 | - Vocabulary.objects.bulk_create(self.new_vocabularies()) | |
504 | + bulk_create(Vocabulary, self.new_vocabularies()) | |
467 | 505 | print 'importing qualifiers...' |
468 | - Qualifier.objects.bulk_create(self.new_qualifiers()) | |
469 | - print 'importing lexemes...' | |
470 | - self.import_lexemes() | |
471 | - print 'importing lexeme associations...' | |
472 | - LexemeAssociation.objects.bulk_create(self.new_lexeme_associations()) | |
473 | - print 'importing cross-reference types...' | |
474 | - CrossReferenceType.objects.bulk_create( | |
475 | - self.new_cross_reference_types()) | |
476 | - print 'importing cross-references...' | |
477 | - self.import_cross_references() | |
506 | + bulk_create(Qualifier, self.new_qualifiers()) | |
478 | 507 | print 'importing pattern types...' |
479 | 508 | self.import_pattern_types() |
480 | 509 | print 'importing patterns...' |
481 | - Pattern.objects.bulk_create(self.new_patterns()) | |
482 | - print 'importing lexeme inflection patterns...' | |
483 | - self.import_lexeme_inflection_patterns() | |
510 | + bulk_create(Pattern, self.new_patterns()) | |
484 | 511 | print 'importing endings...' |
485 | - self.import_endings() | |
512 | + endings, ending_quals = self.new_endings() | |
513 | + bulk_create(Ending, endings) | |
514 | + for pattern, bfl, index, q in ending_quals: | |
515 | + Ending.objects.get( | |
516 | + pattern=pattern, base_form_label=bfl, index=index).qualifiers.add(q) | |
517 | + def import_lexemes(): | |
518 | + print 'importing lexemes...' | |
519 | + lexemes, lexeme_assoc, lexeme_cvs, lexeme_quals = self.new_lexemes() | |
520 | + print '...' | |
521 | + bulk_create(Lexeme, lexemes) | |
522 | + print '...' | |
523 | + bulk_create(LexemeAssociation, lexeme_assoc) | |
524 | + print '...' | |
525 | + for lexeme_id, cv in lexeme_cvs: | |
526 | + cv.lexemes.add(lexeme_id) #add | |
527 | + print '...' | |
528 | + for lexeme_id, q in lexeme_quals: | |
529 | + q.lexeme_set.add(lexeme_id) #add | |
530 | + import_lexemes() | |
531 | + def import_lips(): | |
532 | + print 'importing lexeme inflection patterns...' | |
533 | + lips, lip_quals = self.new_lexeme_inflection_patterns() | |
534 | + print '...' | |
535 | + bulk_create(LexemeInflectionPattern, lips) | |
536 | + print '...' | |
537 | + for lexeme_id, index, q in lip_quals: | |
538 | + LexemeInflectionPattern.objects.get( | |
539 | + lexeme_id=lexeme_id, index=index).qualifiers.add(q) | |
540 | + import_lips() | |
541 | + print 'importing lexeme associations...' | |
542 | + bulk_create(LexemeAssociation, self.new_lexeme_associations()) | |
543 | + print 'importing cross-reference types...' | |
544 | + bulk_create(CrossReferenceType, | |
545 | + self.new_cross_reference_types()) | |
546 | + print 'importing cross-references...' | |
547 | + bulk_create(CrossReference, self.new_cross_references()) | |
548 | + print 'importing variants...' | |
549 | + bulk_create(Variant, self.new_variants()) | |
486 | 550 | print 'importing table templates...' |
551 | + bulk_create(TableTemplate, self.new_table_templates()) | |
552 | + print 'importing tables...' | |
487 | 553 | self.import_tables() |
488 | 554 | print 'importing table headers...' |
489 | - TableHeader.objects.bulk_create(self.new_table_headers()) | |
555 | + bulk_create(TableHeader, self.new_table_headers()) | |
556 | + print 'committing to database...' | |
490 | 557 | self.close() |
491 | - transaction.commit() | |
492 | - transaction.leave_transaction_management() | |
493 | 558 | |
494 | 559 | def single_import(self, model): |
495 | - transaction.commit_unless_managed() | |
496 | - transaction.enter_transaction_management() | |
497 | - transaction.managed() | |
498 | 560 | method_name = METHOD_NAMES[model] |
499 | 561 | if method_name.startswith('new'): |
500 | - model.objects.bulk_create(self.__getattribute__(method_name)()) | |
562 | + bulk_create(model, self.__getattribute__(method_name)()) | |
501 | 563 | elif method_name.startswith('import'): |
502 | 564 | self.__getattribute__(method_name)() |
503 | - self.close() | |
504 | - transaction.commit() | |
505 | - transaction.leave_transaction_management() | |
506 | - | |
507 | -import sys | |
508 | -if __name__ == '__main__': | |
509 | - if sys.argv[-1] == '-mini': | |
510 | - MINI_MODE = True | |
511 | - del sys.argv[-1] | |
512 | - if len(sys.argv) > 1: | |
513 | - db = sys.argv[1] | |
514 | - else: | |
515 | - db = DEFAULT_DATABASE | |
516 | - ImportData(db).delete_and_import() | |
565 | + self.close() | |
517 | 566 | \ No newline at end of file |
... | ... |
dictionary/models.py
... | ... | @@ -79,7 +79,7 @@ class Qualifier(Model): |
79 | 79 | return self.label |
80 | 80 | |
81 | 81 | class Meta: |
82 | - unique_together = ['label', 'vocabulary'] | |
82 | + unique_together = ('label', 'vocabulary') | |
83 | 83 | db_table = 'kwalifikatory' |
84 | 84 | ordering = ['label'] |
85 | 85 | |
... | ... | @@ -192,7 +192,7 @@ class InflectionCharacteristic(Model): |
192 | 192 | |
193 | 193 | class Meta: |
194 | 194 | db_table = 'charfle' |
195 | - unique_together = ['entry', 'part_of_speech'] | |
195 | + unique_together = ('entry', 'part_of_speech') | |
196 | 196 | |
197 | 197 | |
198 | 198 | class PatternType(Model): |
... | ... | @@ -324,7 +324,7 @@ class Lexeme(Model): |
324 | 324 | gloss = TextField(blank=True, db_column='glosa', verbose_name=u'glosa') |
325 | 325 | note = TextField(blank=True, db_column='nota', verbose_name=u'nota') |
326 | 326 | pronunciation = TextField(blank=True, db_column='wymowa', verbose_name=u'wymowa') |
327 | - homonym_number = IntegerField(db_column='hom') | |
327 | + homonym_number = IntegerField(db_column='hom', default=1) | |
328 | 328 | part_of_speech = ForeignKey(PartOfSpeech, db_column='pos', |
329 | 329 | verbose_name=u'cz. mowy') |
330 | 330 | owner_vocabulary = ForeignKey( |
... | ... | @@ -571,7 +571,7 @@ class LexemeInflectionPattern(Model): |
571 | 571 | table[y][x] = { |
572 | 572 | 'type': 'label', |
573 | 573 | 'label': [header.label], |
574 | - 'row_header': header.row_header, | |
574 | + 'css_class': header.css_class, | |
575 | 575 | 'rowspan': header.rowspan, |
576 | 576 | 'colspan': header.colspan, |
577 | 577 | } |
... | ... | @@ -732,6 +732,8 @@ def managed_vocabularies(user): |
732 | 732 | else: |
733 | 733 | return user.managed_vocabularies.all() |
734 | 734 | |
735 | +# kiedyś miało dodatkowe pole, a teraz istnieje tylko dlatego, | |
736 | +# że zapuściło korzenie | |
735 | 737 | class LexemeAssociation(Model): |
736 | 738 | lexeme = ForeignKey(Lexeme, db_column='l_id') |
737 | 739 | vocabulary = ForeignKey(Vocabulary, db_column='slownik') |
... | ... | @@ -865,10 +867,12 @@ class TableHeader(Model): |
865 | 867 | rowspan = IntegerField() |
866 | 868 | colspan = IntegerField() |
867 | 869 | label = CharField(max_length=64, blank=True, db_column='nagl') |
868 | - row_header = BooleanField(db_column='wierszowy') | |
870 | + row_header = BooleanField(db_column='wierszowy') # tymczasowo | |
871 | + css_class = BooleanField(db_column='styl') | |
869 | 872 | |
870 | 873 | def __unicode__(self): |
871 | - return '%s : %s : %s' % (self.label, self.row, self.col) | |
874 | + return '%s (%s,%s) [%s]' % ( | |
875 | + self.label, self.row, self.col, self.css_class) | |
872 | 876 | |
873 | 877 | class Meta: |
874 | 878 | db_table = 'naglowki_tabel' |
... | ... |
dictionary/templates/inflection_table.html
... | ... | @@ -2,41 +2,41 @@ |
2 | 2 | <caption>{{ inflection_characteristic.entry }}</caption> |
3 | 3 | {% for row in table %} |
4 | 4 | <tr> |
5 | - {% for cell in row %} | |
6 | - {% if cell.type != 'span' %} | |
7 | - {% if cell.type == 'empty' %} | |
8 | - <td class='EmptyCell' ></td> | |
9 | - {% else %} | |
10 | - {% if cell.type == 'forms' %} | |
11 | - <td rowspan="{{cell.rowspan}}" colspan="{{cell.colspan}}"> | |
12 | - <ul class='FormList'> | |
13 | - {% for entry in cell.forms %} | |
14 | - <li> | |
15 | - {{ entry.form }} | |
16 | - <span class="qualifiers"> | |
17 | - {% for q in entry.qualifiers %} | |
18 | - {{ q.label }} | |
19 | - {% endfor %} | |
20 | - </span> | |
21 | - </li> | |
22 | - {% endfor %} | |
23 | - </ul> | |
24 | - </td> | |
5 | + {% for cell in row %} | |
6 | + {% if cell.type != 'span' %} | |
7 | + {% if cell.type == 'empty' %} | |
8 | + <td class='EmptyCell' ></td> | |
25 | 9 | {% else %} |
26 | - <td rowspan="{{cell.rowspan}}" colspan="{{cell.colspan}}" | |
27 | - class="{{cell.row_header|yesno:"RowHeader,ColumnHeader"}}"> | |
28 | - <ul class="FormList"> | |
29 | - {% for label in cell.label %} | |
30 | - <li> | |
31 | - {{ label|safe }} | |
32 | - </li> | |
33 | - {% endfor %} | |
34 | - </ul> | |
35 | - </td> | |
10 | + {% if cell.type == 'forms' %} | |
11 | + <td rowspan="{{ cell.rowspan }}" colspan="{{ cell.colspan }}"> | |
12 | + <ul class='FormList'> | |
13 | + {% for entry in cell.forms %} | |
14 | + <li> | |
15 | + {{ entry.form }} | |
16 | + <span class="qualifiers"> | |
17 | + {% for q in entry.qualifiers %} | |
18 | + {{ q.label }} | |
19 | + {% endfor %} | |
20 | + </span> | |
21 | + </li> | |
22 | + {% endfor %} | |
23 | + </ul> | |
24 | + </td> | |
25 | + {% else %} | |
26 | + <td rowspan="{{ cell.rowspan }}" colspan="{{ cell.colspan }}" | |
27 | + class="{{ cell.css_class }}"> | |
28 | + <ul class="FormList"> | |
29 | + {% for label in cell.label %} | |
30 | + <li> | |
31 | + {{ label|safe }} | |
32 | + </li> | |
33 | + {% endfor %} | |
34 | + </ul> | |
35 | + </td> | |
36 | + {% endif %} | |
36 | 37 | {% endif %} |
37 | 38 | {% endif %} |
38 | - {% endif %} | |
39 | - {% endfor %} | |
39 | + {% endfor %} | |
40 | 40 | </tr> |
41 | 41 | {% endfor %} |
42 | 42 | </table> |
... | ... |