commit 7b1494b265f47fc0ea2f644c3417a14830fcaf82 Author: vivekvardhanadepu Date: Sun Jul 11 21:21:50 2021 +0530 Scripts fixup diff --git a/scripts/extract-freq-lexicon.py b/scripts/extract-freq-lexicon.py index 3534ac6..ef7b427 100755 --- a/scripts/extract-freq-lexicon.py +++ b/scripts/extract-freq-lexicon.py @@ -4,6 +4,7 @@ import sys import common +import traceback # Read the corpus, make a note of all ambiguous words, their frequency and their possible translations @@ -69,6 +70,7 @@ def extract_freq_lexicon(canditates): tlword = cur_tl_row[al_tl] else: tlword = cur_tl_row[-1] + traceback.print_stack() print("alignment out", "of", "range", al_tl, @@ -77,6 +79,7 @@ def extract_freq_lexicon(canditates): cur_tl_row, ")", file=sys.stderr) + exit(1) slword = slword if slword not in sl_tl: # { sl_tl[slword] = {} @@ -107,9 +110,10 @@ def extract_freq_lexicon(canditates): # } cur_line = cur_line + 1 - except Exception as e: - print("Error in line", lineno, ":", e, file=sys.stderr) - sys.exit(-1) + except Exception: + # print("Error in line", lineno, ":", e, file=sys.stderr) + traceback.print_exc() + exit(1) # } # } @@ -142,7 +146,7 @@ def extract_freq_lexicon(canditates): if __name__ == '__main__': if len(sys.argv) < 2: # { - print('extract-freq-lexicon.py ') + print('Usage: extract-freq-lexicon.py ', file=sys.stderr) exit(1) # } extract_freq_lexicon(sys.argv[1]) diff --git a/scripts/extract-sentences.py b/scripts/extract-sentences.py index 8d7ee06..c80f77b 100755 --- a/scripts/extract-sentences.py +++ b/scripts/extract-sentences.py @@ -23,21 +23,19 @@ def ambiguous(bt): # { def extract_sentences(phrase_table_file, biltrans_out_file): - reading = True lineno = 0 total_valid = 0 total_errors = 0 not_ambiguous = [] with open(phrase_table_file) as phrase_table, open(biltrans_out_file) as biltrans_out: - while reading: # { + while True: # { try: lineno = lineno + 1 pt_line = phrase_table.readline().strip() bt_line = biltrans_out.readline().strip() if not bt_line.strip() and not pt_line.strip(): # { - reading = False break elif not bt_line.strip() or not pt_line.strip(): # { continue @@ -83,8 +81,7 @@ def extract_sentences(phrase_table_file, biltrans_out_file): print(lineno, '\t' + bt_line) print(lineno, '\t' + row[0]) print(lineno, '\t' + row[2]) - print( - '-------------------------------------------------------------------------------') + print('-'*(len(bt_line)+5)) total_valid += 1 except Exception as e: print("Error in line", lineno, ": ", e, file=sys.stderr) @@ -102,7 +99,7 @@ def extract_sentences(phrase_table_file, biltrans_out_file): if __name__ == '__main__': if len(sys.argv) < 3: # { - print('extact-sentences.py ') + print('Usage: extact-sentences.py ', file=sys.stderr) exit(1) # } diff --git a/scripts/lambdas-to-rules.py b/scripts/lambdas-to-rules.py index d02b87f..745c7c7 100644 --- a/scripts/lambdas-to-rules.py +++ b/scripts/lambdas-to-rules.py @@ -83,7 +83,7 @@ def lambdas_to_rules(freq_lexicon, rules): if __name__ == '__main__': if len(sys.argv) < 3: # { - print('lambdas-to-rules.py ') + print('Usage: lambdas-to-rules.py ', file=sys.stderr) exit(1) # } lambdas_to_rules(sys.argv[1], sys.argv[2]) diff --git a/scripts/merge-ngrams-lambdas.py b/scripts/merge-ngrams-lambdas.py index 1595d26..3ceb065 100644 --- a/scripts/merge-ngrams-lambdas.py +++ b/scripts/merge-ngrams-lambdas.py @@ -47,7 +47,7 @@ def merge_ngrams_lambdas(ngf, ldf): if __name__ == '__main__': if len(sys.argv) < 3: # { - print('merge-ngrams-lambdas.py ') + print('Usage: merge-ngrams-lambdas.py ', file=sys.stderr) exit(1) # } merge_ngrams_lambdas(sys.argv[1], sys.argv[2]) diff --git a/scripts/ngram-count-patterns-maxent2.py b/scripts/ngram-count-patterns-maxent2.py index 693fc82..c3a9714 100755 --- a/scripts/ngram-count-patterns-maxent2.py +++ b/scripts/ngram-count-patterns-maxent2.py @@ -269,7 +269,8 @@ def ngram_count_patterns(freq_lexicon, candidates): if __name__ == '__main__': if len(sys.argv) not in [3, 4]: # { - print('count-patterns.py [threshold]') + print( + 'Usage: count-patterns.py [threshold]', file=sys.stderr) exit(1) # } diff --git a/scripts/ngrams-to-rules-me.py b/scripts/ngrams-to-rules-me.py index 87d0fad..ded1119 100755 --- a/scripts/ngrams-to-rules-me.py +++ b/scripts/ngrams-to-rules-me.py @@ -177,7 +177,7 @@ def ngrams_to_rules(ngrams): if __name__ == '__main__': if len(sys.argv) < 2: # { - print('ngrams-to-rules.py ') + print('Usage: ngrams-to-rules.py ', file=sys.stderr) exit(1) # } ngrams_to_rules(sys.argv[1])