dataLoad.py 6.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258
  1. #!/usr/bin/env python3
  2. from PIL import Image
  3. from pprint import pprint
  4. import sys, time, os, requests, random, json, argparse
  5. parser = argparse.ArgumentParser(description='Unknown program that breaks in strange ways.')
  6. parser.add_argument("--download", help="Download Images", action="store_true")
  7. parser.add_argument("JSON", type=str, nargs="?", help="Filename to save results", default="test.js")
  8. args = parser.parse_args()
  9. pprint(args)
  10. # Should we spend the time to download image, and process it? (True = Yes, False = No)
  11. # DOWNLOAD = False
  12. DOWNLOAD = args.download
  13. # Should we add the JSON in a file? (True is filename, False = do not do)
  14. # JSONME = 'test.js'
  15. JSONME = args.JSON
  16. # NOTE: To begin the insert of the JSONIFIED image and word its
  17. # // T
  18. # A JS comment with a uppercase T
  19. # To stop its
  20. # // t
  21. # A JS comment with a lowercase t
  22. # httpbin.org/headers
  23. sess = requests.Session()
  24. head = {'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/39.0.2171.95 Safari/537.36'}
  25. sess.headers.update(head)
  26. ON = 'X'
  27. OFF = '.'
  28. DIR = 'data'
  29. INTENSITY = 75
  30. im = ''
  31. pix = [0, 0]
  32. size = [0, 0]
  33. pal = ''
  34. if not os.path.exists('in'):
  35. os.mkdir('in')
  36. if not os.path.exists('data'):
  37. os.mkdir('data')
  38. def download(howhard, index):
  39. global sess
  40. """
  41. Download an image based upon how hard it is.
  42. You print out the return value. Are you returning anything useful??
  43. """
  44. r = sess.get(f'http://s0urce.io/client/img/word/{howhard}/{index}')
  45. if(r.status_code == 200):
  46. with open(f'in/{howhard}_{index}.png', 'wb') as f:
  47. f.write(r.content)
  48. return f'{howhard}_{index}.png ' + str(r.status_code)
  49. return r.status_code
  50. def img_point(x, y):
  51. global pix
  52. return pix[x, y]
  53. def img_avg(x, y):
  54. global im, pal
  55. rgb = img_point(x,y)
  56. if(im.mode == 'P'):
  57. rgb = pal[rgb*3:(rgb+1)*3]
  58. if(im.mode == 'I'):
  59. return rgb >> 8
  60. return int( ( rgb[0] + rgb[1] + rgb[2] ) / 3 )
  61. def is_set(x, y):
  62. global INTENSITY
  63. avg = img_avg(x,y)
  64. return (avg < INTENSITY)
  65. def scan_img():
  66. global sx, sy, ex, ey, total
  67. total = 0
  68. sx = size[0]; ex = 0
  69. sy = size[1]; ey = 0
  70. for y in range( 0,size[1] ):
  71. for x in range( 0,size[0] ):
  72. pnt_is = is_set(x,y)
  73. if (pnt_is):
  74. total += 1
  75. if x < sx:
  76. sx = x
  77. if x > ex:
  78. ex = x
  79. if y < sy:
  80. sy = y
  81. if y > ey:
  82. ey = y
  83. #print (sx,ex,sy,ey)
  84. # give us a little border to work with
  85. if sx > 0:
  86. sx -= 1
  87. if ex < size[0]:
  88. ex += 1
  89. if sy > 0:
  90. sy -= 1
  91. if ey < size[1]:
  92. ey += 1
  93. #print (sx,ex,sy,ey)
  94. return(sx,sy,ex,ey)
  95. def save_image():
  96. result = []
  97. for y in range(sy,ey):
  98. s = ''
  99. for x in range(sx,ex):
  100. if is_set(x,y):
  101. s += ON
  102. else:
  103. s += OFF
  104. result.append(s)
  105. return result
  106. def run(difficult):
  107. for x in range(0, 70):
  108. fname = f'in/{difficult}_{x}.png'
  109. # if os.path.exists() ... :(
  110. try:
  111. with open(fname, 'r') as f:
  112. f = f
  113. except FileNotFoundError:
  114. print("File does not exist")
  115. continue
  116. print(f"Loading: {fname}")
  117. im = Image.open(fname)
  118. pix = im.load()
  119. size = im.size
  120. print(f"Size: {size[0]} x {size[1]}")
  121. if(im.mode == 'P'):
  122. pal = im.getpalette()
  123. sx = 0
  124. ex = size[0]
  125. sy = 0
  126. ey = size[1]
  127. total = 0
  128. scan_img()
  129. print(f"Chars within ({sx}, {sy}) - ({ex}, {ey}) total {total} pixels")
  130. img_s = save_image()
  131. for l in img_s:
  132. print(l)
  133. img_s.append(input('Word: '))
  134. with open(f'{DIR}/{difficult}_{x}.txt', 'w') as f:
  135. for i_s in img_s:
  136. f.write(f'{i_s}\n')
  137. print(f"Image saved to '{DIR}/{difficult}_{x}.txt' in byte string")
  138. # os.remove(f'{fname}') # Grr No bad bean, keep file for error checking
  139. # print(f"File '{fname}' automatically removed")
  140. if (DOWNLOAD == True):
  141. print("Downloading s0urce.io Words")
  142. print("EASY")
  143. # time.sleep(5)
  144. for e in range(0, 62):
  145. print(download('e', e))
  146. # time.sleep(random.randint(10, 15))
  147. print("MEDIUM")
  148. # time.sleep(5)
  149. for m in range(0, 66):
  150. print(download('m', m))
  151. # time.sleep(random.randint(10, 15))
  152. print("HARD")
  153. # time.sleep(5)
  154. for h in range(0, 55):
  155. print(download('h', h))
  156. # time.sleep(random.randint(10, 15))
  157. # Img Processing
  158. run('e') # Answer the questions
  159. run('m')
  160. run('h')
  161. # ----------------------------------------------------------------------------------------
  162. # All below was in a seperate dataJS.py file... but now I have fixed it so it's 1 script!
  163. if (JSONME.lower() != 'false'):
  164. print("Now exporting to JSON")
  165. print(f"Targeting file: '{JSONME}'")
  166. time.sleep(5)
  167. def test(t):
  168. global DIR
  169. fname = f'{DIR}/{t}.txt'
  170. r = []
  171. try:
  172. with open(fname, 'r') as f:
  173. for l in f:
  174. r.append(l.strip())
  175. return r
  176. except FileNotFoundError:
  177. return None
  178. def insertJS(item):
  179. global JSON
  180. item = json.dumps(item)
  181. item = f'{item},'
  182. r = []
  183. try:
  184. with open(f'{JSONME}', 'r') as f:
  185. for l in f:
  186. if l != '':
  187. r.append(l.strip('\n'))
  188. else:
  189. r.append('')
  190. except FileNotFoundError:
  191. print(f"File {JSONME} Not Found!")
  192. sys.exit()
  193. c = 0
  194. for e in r:
  195. if('// T' == e):
  196. temp = r[c+1]
  197. del r[c+1]
  198. r.insert(c+1, item)
  199. r.insert(c+2, temp)
  200. elif('// t' == e):
  201. break
  202. c += 1
  203. with open(f'{JSONME}', 'w') as f:
  204. for e in r:
  205. f.write(f'{e}\n')
  206. for x in range(0, 183):
  207. te = test(x)
  208. if(te != None):
  209. word = te
  210. insertJS(word)
  211. print("Complete")