# reply.py (1.8 KB)
import random
import time

from selenium.common.exceptions import NoSuchElementException
from selenium.webdriver.common.action_chains import ActionChains
from selenium.webdriver.common.by import By
  5. def reply(driver, url):
  6. while True:
  7. reply_page_url = get_reply_page_url(driver, url)
  8. driver.get(reply_page_url)
  9. content = get_reply_content(driver)
  10. if not content == '#':
  11. if start_reply(driver, content):
  12. break
  13. time.sleep(2)
  14. # 进行回复动作
  15. def start_reply(driver, content):
  16. try:
  17. message = driver.find_element_by_id('vmessage')
  18. except NoSuchElementException:
  19. return False
  20. else:
  21. ActionChains(driver).move_to_element(message).double_click().perform()
  22. time.sleep(5)
  23. message.send_keys(content)
  24. print(content)
  25. time.sleep(1)
  26. element = driver.find_element_by_id('vreplysubmit')
  27. ActionChains(driver).move_to_element(element).click().perform()
  28. return True
  29. # 读取从上往下第二条评论的内容,并返回
  30. def get_reply_content(driver):
  31. i = 4
  32. while i >= 0:
  33. r = random.randint(3, 12)
  34. r = str(r)
  35. try:
  36. element = driver.find_element_by_xpath(
  37. "//div[@id='postlist']/div[" + r + "]/table/tbody/tr/td[2]/div[2]/div/div/table/tbody/tr/td")
  38. except NoSuchElementException:
  39. i = i - 1
  40. else:
  41. content = element.text
  42. if '发表于' not in content:
  43. return content
  44. else:
  45. i = i - 1
  46. return '#'
  47. # 取得mod发布页面的最后一个页面的url
  48. def get_reply_page_url(driver, url):
  49. driver.get(url)
  50. r = random.randint(0, 24)
  51. r = str(r)
  52. element = driver.find_element_by_xpath("//form[@id='moderate']/table/tbody[last()-" + r + "]/tr/th/a[3]")
  53. return element.get_attribute('href')