dataLoad.py 6.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259
  1. #!/usr/bin/env python3
  2. from PIL import Image
  3. from pprint import pprint
  4. import sys, time, os, requests, random, json, argparse
  5. parser = argparse.ArgumentParser(description='Unknown program that breaks in strange ways.')
  6. parser.add_argument("--download", help="Download Images", action="store_true")
  7. parser.add_argument("JSON", type=str, nargs="?", help="Filename to save results", default="test.js")
  8. args = parser.parse_args()
  9. pprint(args)
  10. # Should we spend the time to download image, and process it? (True = Yes, False = No)
  11. # DOWNLOAD = False
  12. DOWNLOAD = args.download
  13. # Should we add the JSON in a file? (True is filename, False = do not do)
  14. # JSONME = 'test.js'
  15. JSONME = args.JSON
  16. # NOTE: To begin the insert of the JSONIFIED image and word its
  17. # // T
  18. # A JS comment with a uppercase T
  19. # To stop its
  20. # // t
  21. # A JS comment with a lowercase t
  22. # httpbin.org/headers
  23. sess = requests.Session()
  24. head = {'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/39.0.2171.95 Safari/537.36'}
  25. sess.headers.update(head)
  26. ON = 'X'
  27. OFF = '.'
  28. DIR = 'data'
  29. INTENSITY = 75
  30. im = ''
  31. pix = [0, 0]
  32. size = [0, 0]
  33. pal = ''
  34. if not os.path.exists('in'):
  35. os.mkdir('in')
  36. if not os.path.exists('data'):
  37. os.mkdir('data')
  38. def download(howhard, index):
  39. global sess
  40. """
  41. Download an image based upon how hard it is.
  42. Note: This sucks, because it overwrites images.
  43. Why not save the images and how hard?
  44. Quit running your script on floppy disks!
  45. """
  46. r = sess.get(f'http://s0urce.io/client/img/word/{howhard}/{index}')
  47. if(r.status_code == 200):
  48. with open(f'in/{howhard}_{index}.png', 'wb') as f:
  49. f.write(r.content)
  50. return f'{howhard}_{index}.png ' + str(r.status_code)
  51. return r.status_code
  52. def img_point(x, y):
  53. global pix
  54. return pix[x, y]
  55. def img_avg(x, y):
  56. global im, pal
  57. rgb = img_point(x,y)
  58. if(im.mode == 'P'):
  59. rgb = pal[rgb*3:(rgb+1)*3]
  60. if(im.mode == 'I'):
  61. return rgb >> 8
  62. return int( ( rgb[0] + rgb[1] + rgb[2] ) / 3 )
  63. def is_set(x, y):
  64. global INTENSITY
  65. avg = img_avg(x,y)
  66. return (avg < INTENSITY)
  67. def scan_img():
  68. global sx, sy, ex, ey, total
  69. total = 0
  70. sx = size[0]; ex = 0
  71. sy = size[1]; ey = 0
  72. for y in range( 0,size[1] ):
  73. for x in range( 0,size[0] ):
  74. pnt_is = is_set(x,y)
  75. if (pnt_is):
  76. total += 1
  77. if x < sx:
  78. sx = x
  79. if x > ex:
  80. ex = x
  81. if y < sy:
  82. sy = y
  83. if y > ey:
  84. ey = y
  85. #print (sx,ex,sy,ey)
  86. # give us a little border to work with
  87. if sx > 0:
  88. sx -= 1
  89. if ex < size[0]:
  90. ex += 1
  91. if sy > 0:
  92. sy -= 1
  93. if ey < size[1]:
  94. ey += 1
  95. #print (sx,ex,sy,ey)
  96. return(sx,sy,ex,ey)
  97. def save_image():
  98. result = []
  99. for y in range(sy,ey):
  100. s = ''
  101. for x in range(sx,ex):
  102. if is_set(x,y):
  103. s += ON
  104. else:
  105. s += OFF
  106. result.append(s)
  107. return result
  108. def run(difficult):
  109. for x in range(0, 70):
  110. fname = f'in/{difficult}_{x}.png'
  111. try:
  112. with open(fname, 'r') as f:
  113. f = f
  114. except FileNotFoundError:
  115. print("File does not exist")
  116. continue
  117. print(f"Loading: {fname}")
  118. im = Image.open(fname)
  119. pix = im.load()
  120. size = im.size
  121. print(f"Size: {size[0]} x {size[1]}")
  122. if(im.mode == 'P'):
  123. pal = im.getpalette()
  124. sx = 0
  125. ex = size[0]
  126. sy = 0
  127. ey = size[1]
  128. total = 0
  129. scan_img()
  130. print(f"Chars within ({sx}, {sy}) - ({ex}, {ey}) total {total} pixels")
  131. img_s = save_image()
  132. for l in img_s:
  133. print(l)
  134. img_s.append(input('Word: '))
  135. with open(f'{DIR}/{difficult}_{x}.txt', 'w') as f:
  136. for i_s in img_s:
  137. f.write(f'{i_s}\n')
  138. print(f"Image saved to '{DIR}/{difficult}_{x}.txt' in byte string")
  139. # os.remove(f'{fname}') # Grr No bad bean, keep file for error checking
  140. # print(f"File '{fname}' automatically removed")
  141. if (DOWNLOAD == True):
  142. print("Downloading s0urce.io Words")
  143. print("EASY")
  144. # time.sleep(5)
  145. for e in range(0, 62):
  146. print(download('e', e))
  147. # time.sleep(random.randint(10, 15))
  148. print("MEDIUM")
  149. # time.sleep(5)
  150. for m in range(0, 66):
  151. print(download('m', m))
  152. # time.sleep(random.randint(10, 15))
  153. print("HARD")
  154. # time.sleep(5)
  155. for h in range(0, 55):
  156. print(download('h', h))
  157. # time.sleep(random.randint(10, 15))
  158. # Img Processing
  159. run('e') # Answer the questions
  160. run('m')
  161. run('h')
  162. # ----------------------------------------------------------------------------------------
  163. # All below was in a seperate dataJS.py file... but now I have fixed it so it's 1 script!
  164. if (JSONME.lower() != 'false'):
  165. print("Now exporting to JSON")
  166. print(f"Targeting file: '{JSONME}'")
  167. time.sleep(5)
  168. def test(t):
  169. global DIR
  170. fname = f'{DIR}/{t}.txt'
  171. r = []
  172. try:
  173. with open(fname, 'r') as f:
  174. for l in f:
  175. r.append(l.strip())
  176. return r
  177. except FileNotFoundError:
  178. return None
  179. def insertJS(item):
  180. global JSON
  181. item = json.dumps(item)
  182. item = f'{item},'
  183. r = []
  184. try:
  185. with open(f'{JSONME}', 'r') as f:
  186. for l in f:
  187. if l != '':
  188. r.append(l.strip('\n'))
  189. else:
  190. r.append('')
  191. except FileNotFoundError:
  192. print(f"File {JSONME} Not Found!")
  193. sys.exit()
  194. c = 0
  195. for e in r:
  196. if('// T' == e):
  197. temp = r[c+1]
  198. del r[c+1]
  199. r.insert(c+1, item)
  200. r.insert(c+2, temp)
  201. elif('// t' == e):
  202. break
  203. c += 1
  204. with open(f'{JSONME}', 'w') as f:
  205. for e in r:
  206. f.write(f'{e}\n')
  207. for x in range(0, 183):
  208. te = test(x)
  209. if(te != None):
  210. word = te
  211. insertJS(word)
  212. print("Complete")