This is based on the calsyslab project.
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

104 lines
2.7 KiB

1 year ago
1 year ago
  1. __author__ = 'DarkWeb'
  2. '''
  3. Starting point of the Darkweb Mining Platform
  4. '''
  5. import os
  6. from datetime import *
  7. from Forums.BestCardingWorld.crawler_selenium import crawler as crawlerBestCardingWorld
  8. from Forums.CryptBB.crawler_selenium import crawler as crawlerCryptBB
  9. import time
  10. # reads list of marketplaces
  11. def getForums():
  12. forums = []
  13. with open('forumsList.txt') as f:
  14. forums = f.readlines()
  15. return forums
  16. # Creates needed directories for marketplace if doesn't exist
  17. def createDirectory(forum):
  18. # Package should already be there, holding crawler and parser
  19. if forum == 'Reddits':
  20. pagesMainDir = '../' + forum
  21. else:
  22. pagesMainDir = '../' + forum + "/HTML_Pages"
  23. # sharedFolderPath = r'\\VBoxSvr\VM_Files_(shared)'
  24. # pagesMainDir = os.path.join(sharedFolderPath, 'HTML/Forums/' + forum + '/HTML_Pages')
  25. if not os.path.isdir(pagesMainDir):
  26. os.makedirs(pagesMainDir)
  27. if forum == 'Reddits':
  28. createRedditsSubdirectories(pagesMainDir)
  29. else:
  30. createSubdirectories(pagesMainDir)
  31. def createRedditsSubdirectories(pagesMainDir):
  32. with open('../Reddits/redditsList.txt', 'r') as f:
  33. reddits = f.readlines()
  34. for reddit in reddits:
  35. reddit = reddit.strip('\n')
  36. redditMainDir = pagesMainDir + '/' + reddit + '/HTML_Pages'
  37. if not os.path.isdir(redditMainDir):
  38. os.mkdir(redditMainDir)
  39. # Create inner time folders
  40. createSubdirectories(redditMainDir)
  41. def createSubdirectories(pagesDir):
  42. currentDateDir = pagesDir + '/' + str("%02d" %date.today().month) + str("%02d" %date.today().day) + str("%04d" %date.today().year)
  43. if not os.path.isdir(currentDateDir):
  44. os.mkdir(currentDateDir)
  45. listingDir = currentDateDir + '/Listing'
  46. if not os.path.isdir(listingDir):
  47. os.mkdir(listingDir)
  48. listReadDir = listingDir + '/Read'
  49. if not os.path.isdir(listReadDir):
  50. os.mkdir(listReadDir)
  51. descriptionDir = currentDateDir + '/Description'
  52. if not os.path.isdir(descriptionDir):
  53. os.mkdir(descriptionDir)
  54. descReadDir = descriptionDir + '/Read'
  55. if not os.path.isdir(descReadDir):
  56. os.mkdir(descReadDir)
  57. if __name__ == '__main__':
  58. forumsList = getForums()
  59. for forum in forumsList:
  60. forum = forum.replace('\n','')
  61. print("Creating listing and description directories ...")
  62. createDirectory(forum)
  63. time.sleep(5)
  64. input("Directories created successfully. Press ENTER to continue\n")
  65. if forum == "BestCardingWorld":
  66. crawlerBestCardingWorld()
  67. elif forum == "CryptBB":
  68. crawlerCryptBB()
  69. print("Scraping process completed successfully!")