From c15c2a88896b1baab8d180607d66e1ba8befa70b Mon Sep 17 00:00:00 2001 From: Mattia Rizzolo Date: Wed, 23 Oct 2019 18:05:13 +0200 Subject: flake8 fixes to the dictionary-to-thesaurus script tested to work with both python3 and 2.7. Change-Id: I52fe00e1f33e605010cd99885c1a41396440e49d Signed-off-by: Mattia Rizzolo Reviewed-on: https://gerrit.libreoffice.org/81411 Reviewed-by: Thorsten Behrens Reviewed-by: Michael Stahl Tested-by: Michael Stahl --- cs_CZ/thesaurus/dictionary-to-thesaurus.py | 30 +++++++++++++++++++----------- 1 file changed, 19 insertions(+), 11 deletions(-) diff --git a/cs_CZ/thesaurus/dictionary-to-thesaurus.py b/cs_CZ/thesaurus/dictionary-to-thesaurus.py index 3ab22cf..ac4fe67 100755 --- a/cs_CZ/thesaurus/dictionary-to-thesaurus.py +++ b/cs_CZ/thesaurus/dictionary-to-thesaurus.py @@ -18,13 +18,17 @@ import os import re import sys + def usage(): message = """Usage: {program} en-cs.txt blacklist.txt en-cs.txt: Dictionary data from https://www.svobodneslovniky.cz/ blacklist.txt: List of words that should be ignored when generating """ - sys.stderr.write(message.format(program = os.path.basename(sys.argv[0]))) + print( + message.format(program=os.path.basename(sys.argv[0])), + file=sys.stderr) + def classify(typ): if typ == '': @@ -40,6 +44,7 @@ def classify(typ): return '' + def parse(filename, blacklistname): blacklist = {} @@ -92,7 +97,7 @@ def parse(filename, blacklistname): typ = terms[2] # ignore non-translations - if match_ignore.search(typ) != None: + if match_ignore.search(typ) is not None: continue typ = match_cleanup.sub('', typ) @@ -101,24 +106,25 @@ def parse(filename, blacklistname): typ = classify(typ) if index in synonyms: - synonyms[index].append( (word, typ) ) + synonyms[index].append((word, typ)) else: - synonyms[index] = [ (word, typ) ] + synonyms[index] = [(word, typ)] if word in meanings: meanings[word].append(index) else: - meanings[word] = [ index ] + meanings[word] = [index] if typ != '': if word in classification: - if not typ in classification[word]: + if typ not in classification[word]: classification[word].append(typ) else: - classification[word] = [ typ ] + classification[word] = [typ] return (synonyms, meanings, classification) + def buildThesaurus(synonyms, meanings, classification): # for every word: # find all the indexes, and then again map the indexes to words - these are the synonyms @@ -133,7 +139,7 @@ def buildThesaurus(synonyms, meanings, classification): typ = classification[word][0] # we want to output each word just once - used_this_round = [ word ] + used_this_round = [word] output_lines = [] for index in indexes: @@ -142,7 +148,7 @@ def buildThesaurus(synonyms, meanings, classification): # collect types first types = [] for (w, t) in syns: - if not t in types: + if t not in types: types.append(t) # build the various thesaurus lines @@ -153,7 +159,7 @@ def buildThesaurus(synonyms, meanings, classification): if typ != '' and t != '' and typ != t: continue - if not w in used_this_round: + if w not in used_this_round: if t in line: line[t] += '|' + w else: @@ -163,7 +169,7 @@ def buildThesaurus(synonyms, meanings, classification): if len(line) != 0: for t in types: if t in line: - output_lines.append( (t, line[t]) ) + output_lines.append((t, line[t])) if len(output_lines) > 0: print word + '|' + str(len(output_lines)) @@ -180,6 +186,7 @@ def buildThesaurus(synonyms, meanings, classification): else: print line + def main(args): if (len(args) != 3): usage() @@ -190,6 +197,7 @@ def main(args): print "UTF-8" buildThesaurus(synonyms, meanings, classification) + if __name__ == "__main__": main(sys.argv) -- cgit