dataLoad.py 6.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260
  1. #!/usr/bin/env python3
  2. from PIL import Image
  3. from pprint import pprint
  4. import sys, time, os, requests, random, json, argparse
  5. parser = argparse.ArgumentParser(description='Unknown program that breaks in strange ways.')
  6. parser.add_argument("--download", help="Download Images", action="store_true")
  7. parser.add_argument("JSON", type=str, nargs="?", help="Filename to save results", default="test.js")
  8. args = parser.parse_args()
  9. pprint(args)
  10. # Should we spend the time to download image, and process it? (True = Yes, False = No)
  11. # DOWNLOAD = False
  12. DOWNLOAD = args.download
  13. # Should we add the JSON in a file? (True is filename, False = do not do)
  14. # JSONME = 'test.js'
  15. JSONME = args.JSON
  16. # NOTE: To begin the insert of the JSONIFIED image and word its
  17. # // T
  18. # A JS comment with a uppercase T
  19. # To stop its
  20. # // t
  21. # A JS comment with a lowercase t
  22. # httpbin.org/headers
  23. sess = requests.Session()
  24. head = {'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/39.0.2171.95 Safari/537.36'}
  25. sess.headers.update(head)
  26. ON = 'X'
  27. OFF = '.'
  28. DIR = 'data'
  29. INTENSITY = 75
  30. im = ''
  31. pix = [0, 0]
  32. size = [0, 0]
  33. pal = ''
  34. if not os.path.exists('in'):
  35. os.mkdir('in')
  36. if not os.path.exists('data'):
  37. os.mkdir('data')
  38. def download(howhard, index):
  39. global sess
  40. """
  41. Download an image based upon how hard it is.
  42. You print out the return value. Are you returning anything useful??
  43. """
  44. r = sess.get(f'http://s0urce.io/client/img/word/{howhard}/{index}')
  45. if(r.status_code == 200):
  46. with open(f'in/{howhard}_{index}.png', 'wb') as f:
  47. f.write(r.content)
  48. return f'{howhard}_{index}.png ' + str(r.status_code)
  49. return r.status_code
  50. def img_point(x, y):
  51. global pix
  52. return pix[x, y]
  53. def img_avg(x, y):
  54. global im, pal
  55. rgb = img_point(x,y)
  56. if(im.mode == 'P'):
  57. rgb = pal[rgb*3:(rgb+1)*3]
  58. if(im.mode == 'I'):
  59. return rgb >> 8
  60. return int( ( rgb[0] + rgb[1] + rgb[2] ) / 3 )
  61. def is_set(x, y):
  62. global INTENSITY
  63. avg = img_avg(x,y)
  64. return (avg < INTENSITY)
  65. def scan_img():
  66. global sx, sy, ex, ey, total
  67. total = 0
  68. sx = size[0]; ex = 0
  69. sy = size[1]; ey = 0
  70. for y in range( 0,size[1] ):
  71. for x in range( 0,size[0] ):
  72. pnt_is = is_set(x,y)
  73. if (pnt_is):
  74. total += 1
  75. if x < sx:
  76. sx = x
  77. if x > ex:
  78. ex = x
  79. if y < sy:
  80. sy = y
  81. if y > ey:
  82. ey = y
  83. #print (sx,ex,sy,ey)
  84. # give us a little border to work with
  85. if sx > 0:
  86. sx -= 1
  87. if ex < size[0]:
  88. ex += 1
  89. if sy > 0:
  90. sy -= 1
  91. if ey < size[1]:
  92. ey += 1
  93. #print (sx,ex,sy,ey)
  94. return(sx,sy,ex,ey)
  95. def save_image():
  96. result = []
  97. for y in range(sy,ey):
  98. s = ''
  99. for x in range(sx,ex):
  100. if is_set(x,y):
  101. s += ON
  102. else:
  103. s += OFF
  104. result.append(s)
  105. return result
  106. def run(difficult):
  107. global size, pix, im
  108. for x in range(0, 70):
  109. fname = f'in/{difficult}_{x}.png'
  110. # if os.path.exists() ... :(
  111. try:
  112. with open(fname, 'r') as f:
  113. f = f
  114. except FileNotFoundError:
  115. print("File does not exist")
  116. continue
  117. print(f"Loading: {fname}")
  118. im = Image.open(fname)
  119. pix = im.load()
  120. size = im.size
  121. print(f"Size: {size[0]} x {size[1]}")
  122. if(im.mode == 'P'):
  123. pal = im.getpalette()
  124. sx = 0
  125. ex = size[0]
  126. sy = 0
  127. ey = size[1]
  128. total = 0
  129. scan_img()
  130. print(f"Chars within ({sx}, {sy}) - ({ex}, {ey}) total {total} pixels")
  131. img_s = save_image()
  132. for l in img_s:
  133. print(l)
  134. img_s.append(input('Word: '))
  135. with open(f'{DIR}/{difficult}_{x}.txt', 'w') as f:
  136. for i_s in img_s:
  137. f.write(f'{i_s}\n')
  138. print(f"Image saved to '{DIR}/{difficult}_{x}.txt' in byte string")
  139. # os.remove(f'{fname}') # Grr No bad bean, keep file for error checking
  140. # print(f"File '{fname}' automatically removed")
  141. if (DOWNLOAD == True):
  142. print("Downloading s0urce.io Words")
  143. print("EASY")
  144. # time.sleep(5)
  145. for e in range(0, 62):
  146. print(download('e', e))
  147. # time.sleep(random.randint(10, 15))
  148. print("MEDIUM")
  149. # time.sleep(5)
  150. for m in range(0, 66):
  151. print(download('m', m))
  152. # time.sleep(random.randint(10, 15))
  153. print("HARD")
  154. # time.sleep(5)
  155. for h in range(0, 55):
  156. print(download('h', h))
  157. # time.sleep(random.randint(10, 15))
  158. # Img Processing
  159. run('e') # Answer the questions
  160. run('m')
  161. run('h')
  162. # ----------------------------------------------------------------------------------------
  163. # All below was in a seperate dataJS.py file... but now I have fixed it so it's 1 script!
  164. if (JSONME.lower() != 'false'):
  165. print("Now exporting to JSON")
  166. print(f"Targeting file: '{JSONME}'")
  167. time.sleep(5)
  168. def test(t):
  169. global DIR
  170. fname = f'{DIR}/{t}.txt'
  171. r = []
  172. try:
  173. with open(fname, 'r') as f:
  174. for l in f:
  175. r.append(l.strip())
  176. return r
  177. except FileNotFoundError:
  178. return None
  179. def insertJS(item):
  180. global JSON
  181. item = json.dumps(item)
  182. item = f'{item},'
  183. r = []
  184. try:
  185. with open(f'{JSONME}', 'r') as f:
  186. for l in f:
  187. if l != '':
  188. r.append(l.strip('\n'))
  189. else:
  190. r.append('')
  191. except FileNotFoundError:
  192. print(f"File {JSONME} Not Found!")
  193. sys.exit()
  194. c = 0
  195. for e in r:
  196. if('// T' == e):
  197. temp = r[c+1]
  198. del r[c+1]
  199. r.insert(c+1, item)
  200. r.insert(c+2, temp)
  201. elif('// t' == e):
  202. break
  203. c += 1
  204. with open(f'{JSONME}', 'w') as f:
  205. for e in r:
  206. f.write(f'{e}\n')
  207. for x in range(0, 183):
  208. te = test(x)
  209. if(te != None):
  210. word = te
  211. insertJS(word)
  212. print("Complete")