dataLoad.py 6.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259
  1. #!/usr/bin/env python3
  2. from PIL import Image
  3. from pprint import pprint
  4. import sys, time, os, requests, random, json, argparse
  5. parser = argparse.ArgumentParser(description='Unknown program that breaks in strange ways.')
  6. parser.add_argument("--download", help="Download Images", action="store_true")
  7. parser.add_argument("JSON", type=str, nargs="?", help="Filename to save results", default="test.js")
  8. args = parser.parse_args()
  9. pprint(args)
  10. # Should we spend the time to download image, and process it? (True = Yes, False = No)
  11. # DOWNLOAD = False
  12. DOWNLOAD = args.download
  13. # Should we add the JSON in a file? (True is filename, False = do not do)
  14. # JSONME = 'test.js'
  15. JSONME = args.JSON
  16. # NOTE: To begin the insert of the JSONIFIED image and word its
  17. # // T
  18. # A JS comment with a uppercase T
  19. # To stop its
  20. # // t
  21. # A JS comment with a lowercase t
  22. # httpbin.org/headers
  23. sess = requests.Session()
  24. head = {'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/39.0.2171.95 Safari/537.36'}
  25. sess.headers.update(head)
  26. ON = 'X'
  27. OFF = '.'
  28. DIR = 'data'
  29. INTENSITY = 75
  30. im = ''
  31. pix = [0, 0]
  32. size = [0, 0]
  33. pal = ''
  34. if not os.path.exists('in'):
  35. os.mkdir('in')
  36. def download(howhard, index):
  37. global sess
  38. """
  39. Download an image based upon how hard it is.
  40. Note: This sucks, because it overwrites images.
  41. Why not save the images and how hard?
  42. Quit running your script on floppy disks!
  43. """
  44. r = sess.get(f'http://s0urce.io/client/img/word/{howhard}/{index}')
  45. if(r.status_code == 200):
  46. with open(f'in/{index}.png', 'wb') as f:
  47. f.write(r.content)
  48. return f'{index}.png ' + str(r.status_code)
  49. return r.status_code
  50. def img_point(x, y):
  51. global pix
  52. return pix[x, y]
  53. def img_avg(x, y):
  54. global im, pal
  55. rgb = img_point(x,y)
  56. if(im.mode == 'P'):
  57. rgb = pal[rgb*3:(rgb+1)*3]
  58. if(im.mode == 'I'):
  59. return rgb >> 8
  60. return int( ( rgb[0] + rgb[1] + rgb[2] ) / 3 )
  61. def is_set(x, y):
  62. global INTENSITY
  63. avg = img_avg(x,y)
  64. return (avg < INTENSITY)
  65. def scan_img():
  66. global sx, sy, ex, ey, total
  67. total = 0
  68. sx = size[0]; ex = 0
  69. sy = size[1]; ey = 0
  70. for y in range( 0,size[1] ):
  71. for x in range( 0,size[0] ):
  72. pnt_is = is_set(x,y)
  73. if (pnt_is):
  74. total += 1
  75. if x < sx:
  76. sx = x
  77. if x > ex:
  78. ex = x
  79. if y < sy:
  80. sy = y
  81. if y > ey:
  82. ey = y
  83. #print (sx,ex,sy,ey)
  84. # give us a little border to work with
  85. if sx > 0:
  86. sx -= 1
  87. if ex < size[0]:
  88. ex += 1
  89. if sy > 0:
  90. sy -= 1
  91. if ey < size[1]:
  92. ey += 1
  93. #print (sx,ex,sy,ey)
  94. return(sx,sy,ex,ey)
  95. def save_image():
  96. result = []
  97. for y in range(sy,ey):
  98. s = ''
  99. for x in range(sx,ex):
  100. if is_set(x,y):
  101. s += ON
  102. else:
  103. s += OFF
  104. result.append(s)
  105. return result
  106. def run(VAL):
  107. for x in range(0, 70):
  108. fname = f'in/{x}.png'
  109. try:
  110. with open(fname, 'r') as f:
  111. f = f
  112. except FileNotFoundError:
  113. print("File does not exist")
  114. continue
  115. print(f"Loading: {fname}")
  116. im = Image.open(fname)
  117. pix = im.load()
  118. size = im.size
  119. print(f"Size: {size[0]} x {size[1]}")
  120. if(im.mode == 'P'):
  121. pal = im.getpalette()
  122. sx = 0
  123. ex = size[0]
  124. sy = 0
  125. ey = size[1]
  126. total = 0
  127. scan_img()
  128. print(f"Chars within ({sx}, {sy}) - ({ex}, {ey}) total {total} pixels")
  129. img_s = save_image()
  130. for l in img_s:
  131. print(l)
  132. img_s.append(input('Word: '))
  133. y = x + VAL
  134. with open(f'{DIR}/{y}.txt', 'w') as f:
  135. for i_s in img_s:
  136. f.write(f'{i_s}\n')
  137. print(f"Image saved to '{DIR}/{y}.txt' in byte string")
  138. os.remove(f'{fname}')
  139. print(f"File '{fname}' automatically removed")
  140. if (DOWNLOAD == True):
  141. print("Downloading s0urce.io Words")
  142. print("EASY")
  143. time.sleep(5)
  144. for e in range(0, 62):
  145. print(download('e', e))
  146. # time.sleep(random.randint(10, 15))
  147. run(0)
  148. print("MEDIUM")
  149. # time.sleep(5)
  150. for m in range(0, 66):
  151. print(download('m', m))
  152. # time.sleep(random.randint(10, 15))
  153. run(62)
  154. print("HARD")
  155. # time.sleep(5)
  156. for h in range(0, 55):
  157. print(download('h', h))
  158. # time.sleep(random.randint(10, 15))
  159. run(128)
  160. # ----------------------------------------------------------------------------------------
  161. # All below was in a seperate dataJS.py file... but now I have fixed it so it's 1 script!
  162. if (JSONME.lower() != 'false'):
  163. print("Now exporting to JSON")
  164. print(f"Targeting file: '{JSONME}'")
  165. time.sleep(5)
  166. def test(t):
  167. global DIR
  168. fname = f'{DIR}/{t}.txt'
  169. r = []
  170. try:
  171. with open(fname, 'r') as f:
  172. for l in f:
  173. r.append(l.strip())
  174. return r
  175. except FileNotFoundError:
  176. return None
  177. def insertJS(item):
  178. global JSON
  179. item = json.dumps(item)
  180. item = f'{item},'
  181. r = []
  182. try:
  183. with open(f'{JSONME}', 'r') as f:
  184. for l in f:
  185. if l != '':
  186. r.append(l.strip('\n'))
  187. else:
  188. r.append('')
  189. except FileNotFoundError:
  190. print(f"File {JSONME} Not Found!")
  191. sys.exit()
  192. c = 0
  193. for e in r:
  194. if('// T' == e):
  195. temp = r[c+1]
  196. del r[c+1]
  197. r.insert(c+1, item)
  198. r.insert(c+2, temp)
  199. elif('// t' == e):
  200. break
  201. c += 1
  202. with open(f'{JSONME}', 'w') as f:
  203. for e in r:
  204. f.write(f'{e}\n')
  205. for x in range(0, 183):
  206. te = test(x)
  207. if(te != None):
  208. word = te
  209. insertJS(word)
  210. print("Complete")