# IMAGENAMER/Imagenamer.py

"""This program renames image files after the text that OCR finds in them."""

"""SETUP"""
try:
    from PIL import Image
except ImportError:
    import Image
import pytesseract
import os
import string

# Names of the files found in the input directory.
namearray = []
# Index into namearray of the file currently being processed.
indexnow = 0

# Absolute path to our Tesseract installation.
# pytesseract reads this setting from its inner `pytesseract` module, so it has
# to be assigned as `pytesseract.pytesseract.tesseract_cmd`; assigning it on the
# package itself is silently ignored.
# The override is only applied when the executable is really there, so that a
# Tesseract found through PATH keeps working on machines with another layout.
tesseractpath = r'C:\Program Files (x86)\Tesseract-OCR\tesseract'
if os.path.isfile(tesseractpath) or os.path.isfile(tesseractpath + ".exe"):
    pytesseract.pytesseract.tesseract_cmd = tesseractpath

"""FUNCTIONS"""
def ocr(filename):
    """Return the text Tesseract recognises in one image of the input directory.

    Args:
        filename: Name of the image file, relative to ``absolutebasepathin``.

    Returns:
        The string produced by ``pytesseract.image_to_string`` for that image.
    """
    imagepath = os.path.join(absolutebasepathin, filename)
    # Close the image explicitly: the caller renames the file right after this
    # call, and an open handle can block the rename on Windows.
    with Image.open(imagepath) as image:
        return pytesseract.image_to_string(image)

# Characters that are not allowed in Windows file names, plus "." so that the
# recognised text cannot add extra dots to the new name.
_FORBIDDEN_CHARACTERS = str.maketrans("", "", '<>:"/\\|?*.')


def namecleaner(filename, original=None):
    """Turn recognised text into a file name that keeps the source extension.

    Forbidden characters and dots are removed first; every run of whitespace
    (spaces, line breaks) and underscores is then collapsed into a single "_",
    so removing a character can never leave a doubled underscore behind.

    Args:
        filename: Raw text recognised in the image.
        original: Name of the file being renamed; its extension is appended to
            the result. Defaults to the module-level ``basename`` that the
            main loop sets before calling this function.

    Returns:
        The cleaned text followed by the extension of ``original``. When
        nothing usable is left of the text, the stem of ``original`` is used
        so the result is never just an extension.
    """
    print("filenameis "+filename)
    if original is None:
        original = basename
    # splitext copes with extensions of any length (".jpeg", ".tiff") and with
    # names that have no extension at all, unlike a fixed 4-character slice.
    originalstem, extension = os.path.splitext(original)
    stripped = filename.translate(_FORBIDDEN_CHARACTERS)
    words = stripped.replace("_", " ").split()
    cleaned = "_".join(words) or originalstem
    outputname = cleaned + extension
    print("outputnameis "+outputname)
    return outputname

"""CORECODE"""
# Define the input and output directories.
# os.path.join avoids the invalid '\I' escape sequence of the plain string
# literals and yields the same '.\...' text on Windows.
basepathin = os.path.join('.', 'ImagesToConvert')
print("basepathin = "+basepathin)
# NOTE(review): this used to read 'ImageOutput' while the directory actually
# written to was 'ImagesOutput'; the name that was really used is kept here.
basepathout = os.path.join('.', 'ImagesOutput')
print("basepathout = "+basepathout)

# Getting the absolute path to the before named directories
absolutebasepathin = os.path.abspath(basepathin)
print("absolutebasepathin = "+absolutebasepathin)
absolutebasepathout = os.path.abspath(basepathout)
print("absolutebasepathout = "+absolutebasepathout)

# The renames below fail if the output directory is missing, so create it.
os.makedirs(absolutebasepathout, exist_ok=True)

# List all files in the input directory using scandir()
with os.scandir(absolutebasepathin) as entries:
    namearray.extend(entry.name for entry in entries if entry.is_file())

arraylength = len(namearray)
print("arraylength = "+str(arraylength))

# `basename` has to stay a module-level name: namecleaner reads it to find the
# extension of the file being processed.
for basename in namearray:
    print("basename = "+basename)
    # Call ocr
    newname = ocr(basename)
    print("newname = "+newname)
    # Call "namecleaner" to get rid of forbidden characters, line breaks and spaces.
    cleanname = namecleaner(newname)
    print("cleanname = "+cleanname)
    # Two images can contain the same text; add a numeric suffix instead of
    # failing (Windows) or overwriting the earlier file (other systems).
    target = os.path.join(absolutebasepathout, cleanname)
    stem, extension = os.path.splitext(cleanname)
    duplicate = 1
    while os.path.exists(target):
        cleanname = stem+"_"+str(duplicate)+extension
        target = os.path.join(absolutebasepathout, cleanname)
        duplicate = duplicate + 1
    os.rename(os.path.join(absolutebasepathin, basename), target)
    print(basename+" is now renamed as "+cleanname)


print("All images are given a name")
I forgot to comment in the last commit, but now all is commented :D now for real bc i fogot to save 2020-09-10 07:55:00 +00:00			`"""This Program is used to rename image files with its content"""`

			`"""SETUP"""`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`try:`
			`from PIL import Image`
			`except ImportError:`
			`import Image`
			`import pytesseract`
			`import os`
			`import string`

			`namearray = []`
			`indexnow = 0`

I forgot to comment in the last commit, but now all is commented :D now for real bc i fogot to save 2020-09-10 07:55:00 +00:00			`pytesseract.tesseract_cmd = r'C:\Program Files (x86)\Tesseract-OCR\tesseract' #absolute path to out tesseract instalation`
First no error image renamer code 2020-09-09 18:06:33 +00:00
I forgot to comment in the last commit, but now all is commented :D now for real bc i fogot to save 2020-09-10 07:55:00 +00:00			`"""FUNCTIONS"""`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`def ocr(filename):`
I forgot to comment in the last commit, but now all is commented :D now for real bc i fogot to save 2020-09-10 07:55:00 +00:00			`newname = pytesseract.image_to_string(Image.open(absolutebasepathin+"\\"+filename)) # Use pillow to open an image for pytesseract image2string to use`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`return newname`

			`def namecleaner(filename):`
			`print("filenameis "+filename)`
Merge branch 'master' of https://github.com/AlieNeon/Imagenamer 2020-09-10 07:55:19 +00:00			`<<<<<<< HEAD`
I forgot to comment in the last commit, but now all is commented :D now for real bc i fogot to save 2020-09-10 07:55:00 +00:00			`filename = "_".join(filename.split()) # Get rig of line braks and spaces`
			`filename = filename.replace("__","_") # Cleaning duplicated '_'s`
			`filename = filename.replace(" ","") # Get rig of spaces(For recursion)`
			`filename = filename.replace("\n","") # Get rig of line braks(For recursion)`
			`#Get rid of forbiden characters`
Merge branch 'master' of https://github.com/AlieNeon/Imagenamer 2020-09-10 07:55:19 +00:00			`=======`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`filename = "_".join(filename.split())`
I forgot to comment in the last commit, but now all is commented :D 2020-09-10 07:42:36 +00:00			`filename = filename.replace("__","_")`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`filename = filename.replace(" ","")`
			`filename = filename.replace("\n","")`
Merge branch 'master' of https://github.com/AlieNeon/Imagenamer 2020-09-10 07:55:19 +00:00			`>>>>>>> 1ab02cad0d56cf6bd1aa7748ddb11ff8220f9919`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`filename = filename.replace("<","")`
			`filename = filename.replace(">","")`
			`filename = filename.replace(":","")`
			`filename = filename.replace("\"","")`
			`filename = filename.replace("/","")`
			`filename = filename.replace("\\","")`
			`filename = filename.replace("\|","")`
			`filename = filename.replace("?","")`
			`filename = filename.replace("*","")`
I forgot to comment in the last commit, but now all is commented :D now for real bc i fogot to save 2020-09-10 07:55:00 +00:00			`##################################`
			`filename = filename.replace(".","") # Get rid of extra dots`
			`outputname = filename+basename[len(basename)-4:len(basename)] # Get the extension of the file`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`print("outputnameis "+outputname)`
			`return outputname`

I forgot to comment in the last commit, but now all is commented :D now for real bc i fogot to save 2020-09-10 07:55:00 +00:00			`"""CORECODE"""`
			`# Define the input and output directories`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`basepathin = '.\ImagesToConvert'`
			`print("basepathin = "+basepathin)`
			`basepathout = '.\ImageOutput'`
			`print("basepathout = "+basepathout)`
I forgot to comment in the last commit, but now all is commented :D now for real bc i fogot to save 2020-09-10 07:55:00 +00:00
			`# Getting the absolute path to the before named directories`
			`absolutebasepathin = os.path.abspath('.\ImagesToConvert')`
			`print("absolutebasepathin = "+absolutebasepathin)`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`absolutebasepathout = os.path.abspath('.\ImagesOutput')`
			`print("absolutebasepathout = "+absolutebasepathout)`
I forgot to comment in the last commit, but now all is commented :D now for real bc i fogot to save 2020-09-10 07:55:00 +00:00
			`# List all files in a directory using scandir()`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`with os.scandir(basepathin) as entries:`
			`for entry in entries:`
			`if entry.is_file():`
I forgot to comment in the last commit, but now all is commented :D now for real bc i fogot to save 2020-09-10 07:55:00 +00:00			`# Fill an array with the list`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`namearray.append(entry.name)`

I forgot to comment in the last commit, but now all is commented :D now for real bc i fogot to save 2020-09-10 07:55:00 +00:00			`# Get array length for the loop`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`arraylength = len(namearray)`
			`print("arraylength = "+str(arraylength))`

			`while indexnow < arraylength:`
I forgot to comment in the last commit, but now all is commented :D now for real bc i fogot to save 2020-09-10 07:55:00 +00:00			`# Get file name from the array`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`basename = namearray[indexnow]`
			`print("basename = "+basename)`
I forgot to comment in the last commit, but now all is commented :D now for real bc i fogot to save 2020-09-10 07:55:00 +00:00			`# Call ocr`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`newname = ocr(basename)`
			`print("newname = "+newname)`
I forgot to comment in the last commit, but now all is commented :D now for real bc i fogot to save 2020-09-10 07:55:00 +00:00			`# Call "namecleaner" to get rid of forbiden characters, line breaks and spaces.`
First no error image renamer code 2020-09-09 18:06:33 +00:00			`cleanname = namecleaner(newname)`
			`print("cleanname = "+cleanname)`
			`os.rename(absolutebasepathin+"\\"+basename, absolutebasepathout+"\\"+cleanname)`
			`print(basename+" is now renamed as "+cleanname)`
			`indexnow = indexnow + 1`


			`print("All images are given a name")`