[Libreoffice-commits] dictionaries.git: cs_CZ/thesaurus

Thu Oct 24 09:26:29 UTC 2019

cs_CZ/thesaurus/dictionary-to-thesaurus.py |   30 ++++++++++++++++++-----------
 1 file changed, 19 insertions(+), 11 deletions(-)

New commits:
commit c15c2a88896b1baab8d180607d66e1ba8befa70b
Author:     Mattia Rizzolo <mattia at mapreri.org>
AuthorDate: Wed Oct 23 18:05:13 2019 +0200
Commit:     Michael Stahl <michael.stahl at cib.de>
CommitDate: Thu Oct 24 11:26:09 2019 +0200

    flake8 fixes to the dictionary-to-thesaurus script
    
    Tested to work with both Python 3 and Python 2.7.
    
    Change-Id: I52fe00e1f33e605010cd99885c1a41396440e49d
    Signed-off-by: Mattia Rizzolo <mattia at mapreri.org>
    Reviewed-on: https://gerrit.libreoffice.org/81411
    Reviewed-by: Thorsten Behrens <Thorsten.Behrens at CIB.de>
    Reviewed-by: Michael Stahl <michael.stahl at cib.de>
    Tested-by: Michael Stahl <michael.stahl at cib.de>

diff --git a/cs_CZ/thesaurus/dictionary-to-thesaurus.py b/cs_CZ/thesaurus/dictionary-to-thesaurus.py
index 3ab22cf..ac4fe67 100755
--- a/cs_CZ/thesaurus/dictionary-to-thesaurus.py
+++ b/cs_CZ/thesaurus/dictionary-to-thesaurus.py
@@ -18,13 +18,17 @@ import os
 import re
 import sys
 
+
 def usage():
     message = """Usage: {program} en-cs.txt blacklist.txt
 
   en-cs.txt:     Dictionary data from https://www.svobodneslovniky.cz/
   blacklist.txt: List of words that should be ignored when generating
 """
-    sys.stderr.write(message.format(program = os.path.basename(sys.argv[0])))
+    print(
+        message.format(program=os.path.basename(sys.argv[0])),
+        file=sys.stderr)
+
 
 def classify(typ):
     if typ == '':
@@ -40,6 +44,7 @@ def classify(typ):
 
     return ''
 
+
 def parse(filename, blacklistname):
     blacklist = {}
 
@@ -92,7 +97,7 @@ def parse(filename, blacklistname):
                     typ = terms[2]
 
                     # ignore non-translations
-                    if match_ignore.search(typ) != None:
+                    if match_ignore.search(typ) is not None:
                         continue
 
                     typ = match_cleanup.sub('', typ)
@@ -101,24 +106,25 @@ def parse(filename, blacklistname):
                 typ = classify(typ)
 
                 if index in synonyms:
-                    synonyms[index].append( (word, typ) )
+                    synonyms[index].append((word, typ))
                 else:
-                    synonyms[index] = [ (word, typ) ]
+                    synonyms[index] = [(word, typ)]
 
                 if word in meanings:
                     meanings[word].append(index)
                 else:
-                    meanings[word] = [ index ]
+                    meanings[word] = [index]
 
                 if typ != '':
                     if word in classification:
-                        if not typ in classification[word]:
+                        if typ not in classification[word]:
                             classification[word].append(typ)
                     else:
-                        classification[word] = [ typ ]
+                        classification[word] = [typ]
 
     return (synonyms, meanings, classification)
 
+
 def buildThesaurus(synonyms, meanings, classification):
     # for every word:
     #   find all the indexes, and then again map the indexes to words - these are the synonyms
@@ -133,7 +139,7 @@ def buildThesaurus(synonyms, meanings, classification):
             typ = classification[word][0]
 
         # we want to output each word just once
-        used_this_round = [ word ]
+        used_this_round = [word]
 
         output_lines = []
         for index in indexes:
@@ -142,7 +148,7 @@ def buildThesaurus(synonyms, meanings, classification):
             # collect types first
             types = []
             for (w, t) in syns:
-                if not t in types:
+                if t not in types:
                     types.append(t)
 
             # build the various thesaurus lines
@@ -153,7 +159,7 @@ def buildThesaurus(synonyms, meanings, classification):
                 if typ != '' and t != '' and typ != t:
                     continue
 
-                if not w in used_this_round:
+                if w not in used_this_round:
                     if t in line:
                         line[t] += '|' + w
                     else:
@@ -163,7 +169,7 @@ def buildThesaurus(synonyms, meanings, classification):
             if len(line) != 0:
                 for t in types:
                     if t in line:
-                        output_lines.append( (t, line[t]) )
+                        output_lines.append((t, line[t]))
 
         if len(output_lines) > 0:
             print word + '|' + str(len(output_lines))
@@ -180,6 +186,7 @@ def buildThesaurus(synonyms, meanings, classification):
                         else:
                             print line
 
+
 def main(args):
     if (len(args) != 3):
         usage()
@@ -190,6 +197,7 @@ def main(args):
     print "UTF-8"
     buildThesaurus(synonyms, meanings, classification)
 
+
 if __name__ == "__main__":
     main(sys.argv)