# spider_poc.py
  1. import os
  2. import sys
  3. import time
  4. import uiautomator2 as u2
  5. from cnocr import CnOcr
  6. def spider_poc(serial):
  7. d = u2.connect(serial)
  8. d.screen_on()
  9. d.unlock()
  10. d.debug = False
  11. d.app_stop("com.facebook.katana")
  12. d.app_start("com.facebook.katana", use_monkey=True)
  13. time.sleep(3)
  14. # 搜索
  15. d.xpath('//*[@content-desc="搜索"]').click(timeout=3)
  16. # 点击搜索框
  17. d.xpath('//*[@text="搜索"]').click(timeout=3)
  18. # 输入搜索关键词
  19. d(focused=True).set_text('电子元器件')
  20. # 点击搜索
  21. d.press('enter')
  22. time.sleep(6)
  23. # 点击帖子
  24. d.xpath('//*[@content-desc="帖子个搜索结果"]').click(timeout=3)
  25. time.sleep(6)
  26. # 点击展开
  27. d.click(0.461, 0.29)
  28. # 图片识别
  29. root_dir = os.path.dirname(sys.argv[0])
  30. screenshot_name = f'screenshots/{time.time()}.png'
  31. screenshot_dir = os.path.join(root_dir, screenshot_name)
  32. d.screenshot().save(screenshot_dir)
  33. ocr = CnOcr()
  34. res = ocr.ocr(screenshot_dir)
  35. # print(res)
  36. # 找到包含“你的快拍”的元素
  37. text_before_join = ""
  38. for item in res:
  39. if item['text'] in '加入':
  40. break
  41. text_before_join += item['text']
  42. print(text_before_join)
  43. if __name__ == "__main__":
  44. spider_poc('5D7HSG5XXCKVBI85')