|
@@ -3,10 +3,6 @@
|
|
|
from PIL import Image
|
|
|
from pprint import pprint
|
|
|
|
|
|
-<<<<<<< Updated upstream
|
|
|
-import sys, time, os, requests, random, json, argparse
|
|
|
-import subprocess, yaml
|
|
|
-=======
|
|
|
import sys
|
|
|
import time
|
|
|
import os
|
|
@@ -15,7 +11,6 @@ import random
|
|
|
import json
|
|
|
import argparse
|
|
|
import subprocess
|
|
|
->>>>>>> Stashed changes
|
|
|
|
|
|
parser = argparse.ArgumentParser(description="S0urce.io utility program.")
|
|
|
parser.add_argument("--download", help="Download Images", action="store_true")
|
|
@@ -263,13 +258,6 @@ def run(difficult, index):
|
|
|
Where we ask the user what the word is, and after that we save all that to a file in the data directory.
|
|
|
"""
|
|
|
|
|
|
-<<<<<<< Updated upstream
|
|
|
- fname = f"images/{difficult}_{x}.png"
|
|
|
-
|
|
|
- if not os.path.exists(fname):
|
|
|
- print("Could not find '{0}'".format(fname))
|
|
|
- return False # We did not complete
|
|
|
-=======
|
|
|
for x in range(0, 70):
|
|
|
fname = image_filename(difficult, x)
|
|
|
|
|
@@ -278,7 +266,6 @@ def run(difficult, index):
|
|
|
# continue
|
|
|
# We've reached the end, so stop looking. :P
|
|
|
break
|
|
|
->>>>>>> Stashed changes
|
|
|
|
|
|
print(f"Loading: {fname}")
|
|
|
im = Image.open(fname)
|
|
@@ -310,13 +297,9 @@ def run(difficult, index):
|
|
|
# print(f"File '{fname}' automatically removed")
|
|
|
|
|
|
|
|
|
-<<<<<<< Updated upstream
|
|
|
-def autotrain(difficult, index):
|
|
|
-=======
|
|
|
key_word = {}
|
|
|
|
|
|
def autotrain(difficult):
|
|
|
->>>>>>> Stashed changes
|
|
|
"""
|
|
|
run, represents a single execution of components to the image, (Actually we do it 1 category at a time instead of just 1 single execution)
|
|
|
those components do the following... (Each category has around 70 items so we standardize on 70, but )
|
|
@@ -327,29 +310,6 @@ def autotrain(difficult):
|
|
|
Where we ask the user what the word is, and after that we save all that to a file in the data directory.
|
|
|
"""
|
|
|
|
|
|
-<<<<<<< Updated upstream
|
|
|
- # Re aranged the code so I can have it return after each word
|
|
|
- fname = f"images/{difficult}_{x}.png"
|
|
|
-
|
|
|
- if not os.path.exists(fname):
|
|
|
- print("Could not find '{0}'".format(fname))
|
|
|
- return False # We did not complete
|
|
|
-
|
|
|
- print(f"Loading: {fname}")
|
|
|
- fileout = "data/{0}_{1}".format(difficult, x)
|
|
|
- output = subprocess.run(
|
|
|
- ["tesseract", fname, fileout],
|
|
|
- stderr=subprocess.DEVNULL,
|
|
|
- # capture_output=False,
|
|
|
- shell=False,
|
|
|
- )
|
|
|
-
|
|
|
- with open(fileout + ".txt", "r") as fp:
|
|
|
- word = fp.read().strip()
|
|
|
- print(word)
|
|
|
-
|
|
|
- return word # Save this to the dict
|
|
|
-=======
|
|
|
for x in range(0, 70):
|
|
|
fname = image_filename(difficult, x)
|
|
|
|
|
@@ -376,7 +336,6 @@ def autotrain(difficult):
|
|
|
word = fp.read().strip().lower()
|
|
|
key_word[f'{difficult}_{x}'] = word
|
|
|
print(word)
|
|
|
->>>>>>> Stashed changes
|
|
|
|
|
|
|
|
|
# Now to call all the previous functions
|
|
@@ -404,19 +363,9 @@ if args.train:
|
|
|
# Img Processing: Run thru every single category and every single word
|
|
|
wordDict = {}
|
|
|
for level in ["e", "m", "h"]:
|
|
|
-<<<<<<< Updated upstream
|
|
|
- for x in range(0, 66):
|
|
|
- at = autotrain(level, x)
|
|
|
- if(at != False): # If it is complete store it
|
|
|
- wordDict["{0}_{1}".format(level, x)] = at
|
|
|
-
|
|
|
- with open('words.yml', 'w') as f:
|
|
|
- yaml.dump(wordDict, f) # Writes it automatically into the file
|
|
|
-=======
|
|
|
autotrain(level)
|
|
|
with open(args.JSON, 'w') as fp:
|
|
|
json.dump(key_word, fp, sort_keys=True, indent=2)
|
|
|
->>>>>>> Stashed changes
|
|
|
|
|
|
# ----------------------------------------------------------------------------------------
|
|
|
# All below was in a separate dataJS.py file... but now I have fixed it so it's 1 script!
|