Updated the erase & replace Python scripts to sort their globbed file lists

7 years ago · 9e1f618b68
parent cc9c5b39ac
commit 9e1f618b68
2 changed files with 4 additions and 4 deletions
--- a/src/erase_leastcommon.py
+++ b/src/erase_leastcommon.py
@@ -46,8 +46,8 @@ def filternone(word_raw):
 x = -1
 leastcommon_list = []
 allwords = []
-scanimg = glob.glob('images-tiff/*.tiff')
-hocr = glob.glob('hocr/*.html')
+scanimg = sorted(glob.glob('images-tiff/*.tiff'))
+hocr = sorted(glob.glob('hocr/*.html'))
 maximum = 20 / len(scanimg) # this helps the script remove words in a way that is proportional to number of pages scanned 

 # loop through every image in scanimg folder
--- a/src/replace_leastcommon.py
+++ b/src/replace_leastcommon.py
@@ -63,8 +63,8 @@ def filternone(word_raw):
 x = -1
 leastcommon_list = []
 allwords = []
-scanimg = glob.glob('images-tiff/*.tiff')
-hocr = glob.glob('hocr/*.html')
+scanimg = sorted(glob.glob('images-tiff/*.tiff'))
+hocr = sorted(glob.glob('hocr/*.html'))
 num = 0
 maximum = 20 / len(scanimg) # this helps the script remove words in a way that is proportional to number of pages scanned