Browse Source

fixed merge conflicts

main
Khoi 1 year ago
parent
commit
ac80489d4a
35 changed files with 18 additions and 22 deletions
  1. BIN
      Forums/BestCardingWorld/__pycache__/__init__.cpython-311.pyc
  2. BIN
      Forums/BestCardingWorld/__pycache__/crawler_selenium.cpython-310.pyc
  3. BIN
      Forums/BestCardingWorld/__pycache__/crawler_selenium.cpython-311.pyc
  4. BIN
      Forums/BestCardingWorld/__pycache__/parser.cpython-310.pyc
  5. BIN
      Forums/BestCardingWorld/__pycache__/parser.cpython-311.pyc
  6. BIN
      Forums/Classifier/__pycache__/__init__.cpython-310.pyc
  7. BIN
      Forums/Classifier/__pycache__/__init__.cpython-311.pyc
  8. BIN
      Forums/Classifier/__pycache__/classify_product.cpython-310.pyc
  9. BIN
      Forums/Classifier/__pycache__/classify_product.cpython-311.pyc
  10. BIN
      Forums/Classifier/__pycache__/transformer.cpython-310.pyc
  11. BIN
      Forums/Classifier/__pycache__/transformer.cpython-311.pyc
  12. BIN
      Forums/DB_Connection/__pycache__/__init__.cpython-310.pyc
  13. BIN
      Forums/DB_Connection/__pycache__/__init__.cpython-311.pyc
  14. BIN
      Forums/DB_Connection/__pycache__/db_connection.cpython-310.pyc
  15. BIN
      Forums/DB_Connection/__pycache__/db_connection.cpython-311.pyc
  16. BIN
      Forums/Utilities/__pycache__/__init__.cpython-310.pyc
  17. BIN
      Forums/Utilities/__pycache__/__init__.cpython-311.pyc
  18. BIN
      Forums/Utilities/__pycache__/utilities.cpython-310.pyc
  19. BIN
      Forums/Utilities/__pycache__/utilities.cpython-311.pyc
  20. BIN
      Forums/__pycache__/__init__.cpython-310.pyc
  21. BIN
      Forums/__pycache__/__init__.cpython-311.pyc
  22. BIN
      MarketPlaces/BlackPyramid/__pycache__/crawler_selenium.cpython-310.pyc
  23. BIN
      MarketPlaces/BlackPyramid/__pycache__/parser.cpython-310.pyc
  24. BIN
      MarketPlaces/Classifier/__pycache__/__init__.cpython-310.pyc
  25. BIN
      MarketPlaces/Classifier/__pycache__/__init__.cpython-311.pyc
  26. BIN
      MarketPlaces/Classifier/__pycache__/classify_product.cpython-310.pyc
  27. BIN
      MarketPlaces/Classifier/__pycache__/classify_product.cpython-311.pyc
  28. BIN
      MarketPlaces/Classifier/__pycache__/transformer.cpython-310.pyc
  29. BIN
      MarketPlaces/Classifier/__pycache__/transformer.cpython-311.pyc
  30. +12
    -12
      MarketPlaces/DarkMatter/crawler_selenium.py
  31. +1
    -1
      MarketPlaces/Initialization/marketsList.txt
  32. +3
    -7
      MarketPlaces/Initialization/prepare_parser.py
  33. +2
    -2
      MarketPlaces/M00nkeyMarket/crawler_selenium.py
  34. BIN
      MarketPlaces/__pycache__/__init__.cpython-310.pyc
  35. BIN
      MarketPlaces/__pycache__/__init__.cpython-311.pyc

BIN
Forums/BestCardingWorld/__pycache__/__init__.cpython-311.pyc View File


BIN
Forums/BestCardingWorld/__pycache__/crawler_selenium.cpython-310.pyc View File


BIN
Forums/BestCardingWorld/__pycache__/crawler_selenium.cpython-311.pyc View File


BIN
Forums/BestCardingWorld/__pycache__/parser.cpython-310.pyc View File


BIN
Forums/BestCardingWorld/__pycache__/parser.cpython-311.pyc View File


BIN
Forums/Classifier/__pycache__/__init__.cpython-310.pyc View File


BIN
Forums/Classifier/__pycache__/__init__.cpython-311.pyc View File


BIN
Forums/Classifier/__pycache__/classify_product.cpython-310.pyc View File


BIN
Forums/Classifier/__pycache__/classify_product.cpython-311.pyc View File


BIN
Forums/Classifier/__pycache__/transformer.cpython-310.pyc View File


BIN
Forums/Classifier/__pycache__/transformer.cpython-311.pyc View File


BIN
Forums/DB_Connection/__pycache__/__init__.cpython-310.pyc View File


BIN
Forums/DB_Connection/__pycache__/__init__.cpython-311.pyc View File


BIN
Forums/DB_Connection/__pycache__/db_connection.cpython-310.pyc View File


BIN
Forums/DB_Connection/__pycache__/db_connection.cpython-311.pyc View File


BIN
Forums/Utilities/__pycache__/__init__.cpython-310.pyc View File


BIN
Forums/Utilities/__pycache__/__init__.cpython-311.pyc View File


BIN
Forums/Utilities/__pycache__/utilities.cpython-310.pyc View File


BIN
Forums/Utilities/__pycache__/utilities.cpython-311.pyc View File


BIN
Forums/__pycache__/__init__.cpython-310.pyc View File


BIN
Forums/__pycache__/__init__.cpython-311.pyc View File


BIN
MarketPlaces/BlackPyramid/__pycache__/crawler_selenium.cpython-310.pyc View File


BIN
MarketPlaces/BlackPyramid/__pycache__/parser.cpython-310.pyc View File


BIN
MarketPlaces/Classifier/__pycache__/__init__.cpython-310.pyc View File


BIN
MarketPlaces/Classifier/__pycache__/__init__.cpython-311.pyc View File


BIN
MarketPlaces/Classifier/__pycache__/classify_product.cpython-310.pyc View File


BIN
MarketPlaces/Classifier/__pycache__/classify_product.cpython-311.pyc View File


BIN
MarketPlaces/Classifier/__pycache__/transformer.cpython-310.pyc View File


BIN
MarketPlaces/Classifier/__pycache__/transformer.cpython-311.pyc View File


+ 12
- 12
MarketPlaces/DarkMatter/crawler_selenium.py View File

@ -32,17 +32,17 @@ baseURL = 'http://darkmat3kdxestusl437urshpsravq7oqb7t3m36u2l62vnmmldzdmid.onion
# Opens Tor Browser, crawls the website, then parses, then closes tor # Opens Tor Browser, crawls the website, then parses, then closes tor
#acts like the main method for the crawler, another function at the end of this code calls this function later #acts like the main method for the crawler, another function at the end of this code calls this function later
def startCrawling(): def startCrawling():
# opentor()
opentor()
mktName = getMKTName() mktName = getMKTName()
# driver = getAccess()
driver = getAccess()
# if driver != 'down':
# try:
# login(driver)
# crawlForum(driver)
# except Exception as e:
# print(driver.current_url, e)
# closetor(driver)
if driver != 'down':
try:
login(driver)
crawlForum(driver)
except Exception as e:
print(driver.current_url, e)
closetor(driver)
new_parse(mktName, baseURL, False) new_parse(mktName, baseURL, False)
@ -190,11 +190,11 @@ def getInterestedLinks():
# legit # legit
links.append('http://darkmat3kdxestusl437urshpsravq7oqb7t3m36u2l62vnmmldzdmid.onion/market/products/?category=78') links.append('http://darkmat3kdxestusl437urshpsravq7oqb7t3m36u2l62vnmmldzdmid.onion/market/products/?category=78')
# # hack guides # # hack guides
# links.append('http://darkmat3kdxestusl437urshpsravq7oqb7t3m36u2l62vnmmldzdmid.onion/market/products/?category=94')
links.append('http://darkmat3kdxestusl437urshpsravq7oqb7t3m36u2l62vnmmldzdmid.onion/market/products/?category=94')
# # services # # services
# links.append('http://darkmat3kdxestusl437urshpsravq7oqb7t3m36u2l62vnmmldzdmid.onion/market/products/?category=117')
links.append('http://darkmat3kdxestusl437urshpsravq7oqb7t3m36u2l62vnmmldzdmid.onion/market/products/?category=117')
# # software/malware # # software/malware
# links.append('http://darkmat3kdxestusl437urshpsravq7oqb7t3m36u2l62vnmmldzdmid.onion/market/products/?category=121')
links.append('http://darkmat3kdxestusl437urshpsravq7oqb7t3m36u2l62vnmmldzdmid.onion/market/products/?category=121')
return links return links


+ 1
- 1
MarketPlaces/Initialization/marketsList.txt View File

@ -1 +1 @@
DigitalThriftShop
M00nkeyMarket

+ 3
- 7
MarketPlaces/Initialization/prepare_parser.py View File

@ -224,8 +224,7 @@ def new_parse(marketPlace, url, createLog):
else: else:
parseError = True parseError = True
except Exception as e:# change back
print(e)
except:
nError += 1 nError += 1
print("There was a problem to parse the file " + line1 + " in the listing section!") print("There was a problem to parse the file " + line1 + " in the listing section!")
@ -268,7 +267,7 @@ def new_parse(marketPlace, url, createLog):
try: try:
persist_data(url, tuple(rec), cur) persist_data(url, tuple(rec), cur)
con.commit() con.commit()
except Exception as e:
except:
trace = traceback.format_exc() trace = traceback.format_exc()
@ -291,10 +290,7 @@ def new_parse(marketPlace, url, createLog):
try: try:
shutil.move(source, destination) shutil.move(source, destination)
num_persisted_moved += 1 num_persisted_moved += 1
except Exception as e:
# except:
print(e)
except:
print("There was a problem to move the file " + detPage[key]['filename'] + " in the Description section!") print("There was a problem to move the file " + detPage[key]['filename'] + " in the Description section!")
nError += 1 nError += 1
if createLog: if createLog:


+ 2
- 2
MarketPlaces/M00nkeyMarket/crawler_selenium.py View File

@ -153,7 +153,7 @@ def login(driver):
# Password here # Password here
passwordBox.send_keys('genie_show_metheWorld') passwordBox.send_keys('genie_show_metheWorld')
input("Press ENTER when CAPTCHA and exit pressed is completed\n")
input("Press ENTER when CAPTCHA and exit pressed is completed\nWAIT FOR PAGE TO LOAD SOMETIMES THY SEND NEWSLETTERS")
# wait for listing page show up (This Xpath may need to change based on different seed url) # wait for listing page show up (This Xpath may need to change based on different seed url)
WebDriverWait(driver, 100).until(EC.visibility_of_element_located( WebDriverWait(driver, 100).until(EC.visibility_of_element_located(
@ -203,7 +203,7 @@ def getInterestedLinks():
# software # software
links.append('http://moonkey4f2mkcp6hpackeea356puiry27h3dz3hzbt3adbmsk4gs7wyd.onion/search/subcategories?subcategory=30') links.append('http://moonkey4f2mkcp6hpackeea356puiry27h3dz3hzbt3adbmsk4gs7wyd.onion/search/subcategories?subcategory=30')
# # guides # # guides
# links.append('http://moonkey4f2mkcp6hpackeea356puiry27h3dz3hzbt3adbmsk4gs7wyd.onion/search/subcategories?subcategory=17')
links.append('http://moonkey4f2mkcp6hpackeea356puiry27h3dz3hzbt3adbmsk4gs7wyd.onion/search/subcategories?subcategory=17')
return links return links


BIN
MarketPlaces/__pycache__/__init__.cpython-310.pyc View File


BIN
MarketPlaces/__pycache__/__init__.cpython-311.pyc View File


Loading…
Cancel
Save