# crack.py (5.6 KB)
  1. #!/usr/bin/python
  2. # -*- coding: iso-8859-15 -*-
  3. """
  4. This file is part of the cintruder project, http://cintruder.03c8.net
  5. Copyright (c) 2012/2016 psy <epsylon@riseup.net>
  6. cintruder is free software; you can redistribute it and/or modify it under
  7. the terms of the GNU General Public License as published by the Free
  8. Software Foundation version 3 of the License.
  9. cintruder is distributed in the hope that it will be useful, but WITHOUT ANY
  10. WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
  11. FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
  12. details.
  13. You should have received a copy of the GNU General Public License along
  14. with cintruder; if not, write to the Free Software Foundation, Inc., 51
  15. Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
  16. """
  17. from PIL import Image
  18. import hashlib, os, math, time
  19. import shutil
  20. class VectorCompare:
  21. def magnitude(self, concordance):
  22. total = 0
  23. for word, count in concordance.iteritems():
  24. # print concordance
  25. total += count ** 2
  26. return math.sqrt(total)
  27. def relation(self, concordance1, concordance2):
  28. topvalue = 0
  29. for word, count in concordance1.iteritems():
  30. if concordance2.has_key(word):
  31. topvalue += count * concordance2[word]
  32. return topvalue / (self.magnitude(concordance1) * self.magnitude(concordance2))
  33. class CIntruderCrack(object):
  34. """
  35. Class to bruteforce captchas
  36. """
  37. def __init__(self, captcha=""):
  38. """
  39. Initialize main CIntruder
  40. """
  41. self.captcha = self.set_captcha(captcha)
  42. start = time.time()
  43. if not os.path.exists("core/images/previews/"):
  44. os.mkdir("core/images/previews/")
  45. else:
  46. shutil.rmtree("core/images/previews/")
  47. os.mkdir("core/images/previews/")
  48. def buildvector(self, im):
  49. d1 = {}
  50. count = 0
  51. for i in im.getdata():
  52. d1[count] = i
  53. count += 1
  54. return d1
  55. def set_captcha(self, captcha):
  56. """
  57. Set the captcha.
  58. """
  59. self.captcha = captcha
  60. return captcha
  61. def crack(self, options):
  62. v = VectorCompare()
  63. path, dirs, files = os.walk("dictionary/").next()
  64. dictionary = dirs
  65. imageset = []
  66. last_letter = None
  67. print "\n[Info] Loading dictionary...\n"
  68. for letter in dictionary:
  69. for img in os.listdir('dictionary/'+letter):
  70. temp = []
  71. temp.append(self.buildvector(Image.open("dictionary/%s/%s"%(letter, img))))
  72. imageset.append({letter:temp})
  73. try:
  74. im = Image.open(self.captcha)
  75. im.save("core/images/previews/last-preview.gif")
  76. im2 = Image.new("P", im.size, 255)
  77. im = im.convert("P")
  78. except:
  79. print "\nError during cracking!. Is that captcha supported?\n"
  80. return
  81. temp = {}
  82. for x in range(im.size[1]):
  83. for y in range(im.size[0]):
  84. pix = im.getpixel((y, x))
  85. temp[pix] = pix
  86. if pix == 3: # pixel colour id
  87. im2.putpixel((y, x), 0)
  88. inletter = False
  89. foundletter = False
  90. start = 0
  91. end = 0
  92. letters = []
  93. for y in range(im2.size[0]): # slice across
  94. for x in range(im2.size[1]): # slice down
  95. pix = im2.getpixel((y, x))
  96. if pix != 255:
  97. inletter = True
  98. if foundletter == False and inletter == True:
  99. foundletter = True
  100. start = y
  101. if foundletter == True and inletter == False:
  102. foundletter = False
  103. end = y
  104. letters.append((start, end))
  105. inletter = False
  106. count = 0
  107. countid = 1
  108. word_sug = None
  109. end = time.time()
  110. elapsed = end - start
  111. words = {}
  112. for letter in letters:
  113. m = hashlib.md5()
  114. im3 = im2.crop((letter[0], 0, letter[1], im2.size[1]))
  115. guess = []
  116. for image in imageset:
  117. for x, y in image.iteritems():
  118. if len(y) != 0:
  119. guess.append(( v.relation(y[0], self.buildvector(im3)), x))
  120. guess.sort(reverse=True)
  121. word_per = guess[0][0] * 100
  122. if str(word_per) == "100.0":
  123. print "Image position :", countid
  124. print "Broken Percent :", int(round(float(word_per))), "%", "[+CRACKED!]"
  125. words[countid] = guess[0][1]
  126. else:
  127. print "Image position :", countid
  128. print "Broken Percent :", "%.4f" % word_per, "%"
  129. words[countid] = "_"
  130. print "Word suggested :", guess[0][1]
  131. print "-------------------"
  132. if word_sug == None:
  133. word_sug = str(guess[0][1])
  134. else:
  135. word_sug = word_sug + str(guess[0][1])
  136. count += 1
  137. countid = countid + 1
  138. print "\n========================================"
  139. if options.verbose:
  140. print "[Info] Elapsed OCR time :", elapsed
  141. print "========================================"
  142. if word_sug is None:
  143. print "Suggested Solution: ", "[ No idea!. Try to add more images to your dictionary/]"
  144. else:
  145. print "Cracked Words: ", words.values()
  146. print "Suggested Solution: ", "[", word_sug, "]"
  147. print "========================================\n"
  148. return word_sug