This is based on the calsyslab project.
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

115 lines
3.1 KiB

1 year ago
1 year ago
1 year ago
1 year ago
1 year ago
1 year ago
1 year ago
1 year ago
1 year ago
1 year ago
  1. __author__ = 'DarkWeb'
  2. '''
  3. Starting point of the Darkweb Mining Platform
  4. '''
  5. import os
  6. from datetime import *
  7. from Forums.BestCardingWorld.crawler_selenium import crawler as crawlerBestCardingWorld
  8. from Forums.CryptBB.crawler_selenium import crawler as crawlerCryptBB
  9. from Forums.OnniForums.crawler_selenium import crawler as crawlerOnniForums
  10. #from Forums.CrackingPro.crawler_selenium import crawler as crawlerCrackingPro
  11. import time
  12. # reads list of marketplaces manually inputted
  13. def getForums():
  14. forums = []
  15. with open('forumsList.txt') as f:
  16. forums = f.readlines()
  17. return forums
  18. # Creates needed directories for marketplace if doesn't exist
  19. def createDirectory(forum):
  20. # Package should already be there, holding crawler and parser
  21. if forum == 'Reddits':
  22. pagesMainDir = '../' + forum
  23. else:
  24. pagesMainDir = '../' + forum + "/HTML_Pages"
  25. # sharedFolderPath = r'\\VBoxSvr\VM_Files_(shared)'
  26. # pagesMainDir = os.path.join(sharedFolderPath, 'HTML/Forums/' + forum + '/HTML_Pages')
  27. if not os.path.isdir(pagesMainDir):
  28. os.makedirs(pagesMainDir)
  29. if forum == 'Reddits':
  30. createRedditsSubdirectories(pagesMainDir)
  31. else:
  32. createSubdirectories(pagesMainDir)
  33. def createRedditsSubdirectories(pagesMainDir):
  34. with open('../Reddits/redditsList.txt', 'r') as f:
  35. reddits = f.readlines()
  36. for reddit in reddits:
  37. reddit = reddit.strip('\n')
  38. redditMainDir = pagesMainDir + '/' + reddit + '/HTML_Pages'
  39. if not os.path.isdir(redditMainDir):
  40. os.mkdir(redditMainDir)
  41. # Create inner time folders
  42. createSubdirectories(redditMainDir)
  43. def createSubdirectories(pagesDir):
  44. currentDateDir = pagesDir + '/' + str("%02d" %date.today().month) + str("%02d" %date.today().day) + str("%04d" %date.today().year)
  45. if not os.path.isdir(currentDateDir):
  46. os.mkdir(currentDateDir)
  47. listingDir = currentDateDir + '/Listing'
  48. if not os.path.isdir(listingDir):
  49. os.mkdir(listingDir)
  50. listReadDir = listingDir + '/Read'
  51. if not os.path.isdir(listReadDir):
  52. os.mkdir(listReadDir)
  53. descriptionDir = currentDateDir + '/Description'
  54. if not os.path.isdir(descriptionDir):
  55. os.mkdir(descriptionDir)
  56. descReadDir = descriptionDir + '/Read'
  57. if not os.path.isdir(descReadDir):
  58. os.mkdir(descReadDir)
  59. #main method
  60. if __name__ == '__main__':
  61. #assignment from forumsList.txt
  62. forumsList = getForums()
  63. #get forum from forumsList
  64. for forum in forumsList:
  65. forum = forum.replace('\n','')
  66. print("Creating listing and description directories ...")
  67. createDirectory(forum)
  68. time.sleep(5) #wait for directories to be created
  69. input("Directories created successfully. Press ENTER to continue\n")
  70. if forum == "BestCardingWorld":
  71. crawlerBestCardingWorld()
  72. elif forum == "CryptBB":
  73. crawlerCryptBB()
  74. elif forum == "OnniForums":
  75. crawlerOnniForums()
  76. elif forum == "CrackingPro":
  77. crawlerCrackingPro()
  78. print("Scraping process completed successfully!")