dataLoad.py 5.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239
  1. #!/usr/bin/env python3
  2. from PIL import Image
  3. from pprint import pprint
  4. import sys, time, os, requests, random, json
  5. # Should we spend the time to download image, and process it? (True = Yes, False = No)
  6. DOWNLOAD = False
  7. # Should we add the JSON in a file? (True is filename, False = do not do)
  8. JSONME = 'test.js'
  9. # NOTE: To begin the insert of the JSONIFIED image and word its
  10. # // T
  11. # A JS comment with a uppercase T
  12. # To stop its
  13. # // t
  14. # A JS comment with a lowercase t
  15. # httpbin.org/headers
  16. S = requests.Session()
  17. head = {'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/39.0.2171.95 Safari/537.36'}
  18. S.headers.update(head)
  19. ON = 'X'
  20. OFF = '.'
  21. DIR = 'data'
  22. INTENSITY = 75
  23. im = ''
  24. pix = [0, 0]
  25. size = [0, 0]
  26. pal = ''
  27. def download(o, i):
  28. global S
  29. r = S.get(f'http://s0urce.io/client/img/word/{o}/{i}')
  30. if(r.status_code == 200):
  31. with open(f'in/{i}.png', 'wb') as f:
  32. f.write(r.content)
  33. return f'{i}.png ' + str(r.status_code)
  34. return r.status_code
  35. def img_point(x, y):
  36. global pix
  37. return pix[x, y]
  38. def img_avg(x, y):
  39. global im, pal
  40. rgb = img_point(x,y)
  41. if(im.mode == 'P'):
  42. rgb = pal[rgb*3:(rgb+1)*3]
  43. if(im.mode == 'I'):
  44. return rgb >> 8
  45. return int( ( rgb[0] + rgb[1] + rgb[2] ) / 3 )
  46. def is_set(x, y):
  47. global INTENSITY
  48. avg = img_avg(x,y)
  49. return (avg < INTENSITY)
  50. def scan_img():
  51. global sx, sy, ex, ey, total
  52. total = 0
  53. sx = size[0]; ex = 0
  54. sy = size[1]; ey = 0
  55. for y in range( 0,size[1] ):
  56. for x in range( 0,size[0] ):
  57. pnt_is = is_set(x,y)
  58. if (pnt_is):
  59. total += 1
  60. if x < sx:
  61. sx = x
  62. if x > ex:
  63. ex = x
  64. if y < sy:
  65. sy = y
  66. if y > ey:
  67. ey = y
  68. #print (sx,ex,sy,ey)
  69. # give us a little border to work with
  70. if sx > 0:
  71. sx -= 1
  72. if ex < size[0]:
  73. ex += 1
  74. if sy > 0:
  75. sy -= 1
  76. if ey < size[1]:
  77. ey += 1
  78. #print (sx,ex,sy,ey)
  79. return(sx,sy,ex,ey)
  80. def save_image():
  81. result = []
  82. for y in range(sy,ey):
  83. s = ''
  84. for x in range(sx,ex):
  85. if is_set(x,y):
  86. s += ON
  87. else:
  88. s += OFF
  89. result.append(s)
  90. return result
  91. def run(VAL):
  92. for x in range(0, 70):
  93. fname = f'in/{x}.png'
  94. try:
  95. with open(fname, 'r') as f:
  96. f = f
  97. except FileNotFoundError:
  98. print("File does not exist")
  99. continue
  100. print(f"Loading: {fname}")
  101. im = Image.open(fname)
  102. pix = im.load()
  103. size = im.size
  104. print(f"Size: {size[0]} x {size[1]}")
  105. if(im.mode == 'P'):
  106. pal = im.getpalette()
  107. sx = 0
  108. ex = size[0]
  109. sy = 0
  110. ey = size[1]
  111. total = 0
  112. scan_img()
  113. print(f"Chars within ({sx}, {sy}) - ({ex}, {ey}) total {total} pixels")
  114. img_s = save_image()
  115. for l in img_s:
  116. print(l)
  117. img_s.append(input('Word: '))
  118. y = x + VAL
  119. with open(f'{DIR}/{y}.txt', 'w') as f:
  120. for i_s in img_s:
  121. f.write(f'{i_s}\n')
  122. print(f"Image saved to '{DIR}/{y}.txt' in byte string")
  123. os.remove(f'{fname}')
  124. print(f"File '{fname}' automatically removed")
  125. if(DOWNLOAD == True):
  126. print("Downloading s0urce.io Words")
  127. print("EASY")
  128. time.sleep(5)
  129. for e in range(0, 62):
  130. print(download('e', e))
  131. time.sleep(random.randint(10, 15))
  132. run(0)
  133. print("MEDIUM")
  134. time.sleep(5)
  135. for m in range(0, 66):
  136. print(download('m', m))
  137. time.sleep(random.randint(10, 15))
  138. run(62)
  139. print("HARD")
  140. time.sleep(5)
  141. for h in range(0, 55):
  142. print(download('h', h))
  143. time.sleep(random.randint(10, 15))
  144. run(128)
  145. # ----------------------------------------------------------------------------------------
  146. # All below was in a seperate dataJS.py file... but now I have fixed it so it's 1 script!
  147. if(JSONME.lower() != 'false'):
  148. print("Now exporting to JSON")
  149. print(f"Targeting file: '{JSONME}'")
  150. time.sleep(5)
  151. def test(t):
  152. global DIR
  153. fname = f'{DIR}/{t}.txt'
  154. r = []
  155. try:
  156. with open(fname, 'r') as f:
  157. for l in f:
  158. r.append(l.strip())
  159. return r
  160. except FileNotFoundError:
  161. return None
  162. def insertJS(item):
  163. global JSON
  164. item = json.dumps(item)
  165. item = f'{item},'
  166. r = []
  167. try:
  168. with open(f'{JSONME}', 'r') as f:
  169. for l in f:
  170. if l != '':
  171. r.append(l.strip('\n'))
  172. else:
  173. r.append('')
  174. except FileNotFoundError:
  175. print(f"File {JSONME} Not Found!")
  176. sys.exit()
  177. c = 0
  178. for e in r:
  179. if('// T' == e):
  180. temp = r[c+1]
  181. del r[c+1]
  182. r.insert(c+1, item)
  183. r.insert(c+2, temp)
  184. elif('// t' == e):
  185. break
  186. c += 1
  187. with open(f'{JSONME}', 'w') as f:
  188. for e in r:
  189. f.write(f'{e}\n')
  190. for x in range(0, 183):
  191. te = test(x)
  192. if(te != None):
  193. word = te
  194. insertJS(word)
  195. print("Complete")