利用uiautomator2加模拟器自动刷抖音下载无水印视频

suyaming 发表于 2021-10-7 17:41

本帖最后由 suyaming 于 2021-10-7 19:27 编辑

### 准备

1.adb
2.任意模拟器，我这里用的是夜神

### 成果展示

...试了半天，找不到处理gif的办法，40多m，放蓝奏自己看吧
[这里](https://suyaming.lanzoui.com/iNlrLv1hwyf)

颜值检测效果

### 代码
```
import base64
import os
import time
import re
import uiautomator2 as u2
import requests
from jsonpath import jsonpath
from concurrent.futures import ThreadPoolExecutor

def get_mid_str(s, start_str, stop_str):
# 查找左边文本的结束位置
start_pos = s.find(start_str)
if start_pos == -1:
   return None
start_pos += len(start_str)
# 查找右边文本的起始位置
stop_pos = s.find(stop_str, start_pos)
if stop_pos == -1:
   return None

# 通过切片取出中间的文本
return s

class DouyinDown:
def __init__(self):
   self.device = u2.connect('127.0.0.1:62001')# 这里改成自己的设备
   self.down_url = []

def get_downurl(self):
   de = self.device
   de.app_start('com.ss.android.ugc.aweme')
   while True:
         if len(self.down_url) <= 5:
            share_btn = de(resourceId="com.ss.android.ugc.aweme:id/share_container")
            if de(text='点击进入直播间').exists:
               de.swipe_ext('up', 1)
               print("直播间,跳过")
            else:
               if self.check_beauty() is True:
                     share_btn.click()
                     if share_btn.exists:
                        share_btn.click()
                     else:
                        if de(text='复制链接').exists:
                           de(text='复制链接').click()
                        else:
                           zb = de.xpath('//*[@resource-id="com.ss.android.ugc.aweme:id/is-"]').rect
                           de.swipe(zb + 400, zb + 50, zb, zb + 20, 0.05)
                           de(text='复制链接').click()
                        self.down_url.append(de.clipboard)
                        de.swipe_ext('up', 1)
               else:
                     de.swipe_ext('up', 1)
         else:
            time.sleep(5)

def check_beauty(self):
   api_key = '' # 百度开放平台api_key
   secret_key = '' # 百度开放平台secret_key
   url = 'https://aip.baidubce.com/oauth/2.0/token?grant_type=client_credentials&client_id=' + api_key + '&client_secret=' + secret_key
   get_acces_token = requests.get(url).json()
   acces_token = jsonpath(get_acces_token, '$..access_token')
   de = self.device
   time.sleep(2)
   screenshot = de.xpath('//*[@resource-id="com.ss.android.ugc.aweme:id/ge0"]').screenshot()
   screenshot.save('screenshot.jpg')
   with open('screenshot.jpg', 'rb') as f:
         base64_data = base64.b64encode(f.read())
   request_url = "https://aip.baidubce.com/rest/2.0/face/v3/detect"
   post_data = {
         "image": base64_data,
         "image_type": "BASE64",
         "face_field": "gender,age,beauty,gender",
         "face_type": "LIVE"
   }
   headers = {
         "Content-Type": "application/json;"
   }
   age, beauty, gender = 0, 0, 'male'
   request_url = request_url + "?access_token=" + acces_token
   response = requests.post(url=request_url, data=post_data, headers=headers)
   json_result = response.json()
   error_msg = jsonpath(json_result, '$..error_msg')
   if error_msg == 'SUCCESS':
         age = jsonpath(json_result, '$..age')
         beauty = jsonpath(json_result, '$..beauty')
         gender = jsonpath(json_result, '$..type')
         print(age, beauty, gender)
   else:
         print('未识别到人脸')
         return False
   if int(age) <= 30 and int(beauty) >= 60 and gender == 'female':
         return True
   else:
         return False

def down_video(self):
   headers = {
         'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/92.0.4515.107 Safari/537.36'
   }
   while True:
         if len(self.down_url) == 0:
            time.sleep(5)
         else:
            url = re.search('https://+', self.down_url).group()
            video_id = get_mid_str(requests.get(url).url, 'video/', '?previous')
            respone = requests.get('https://www.iesdouyin.com/web/api/v2/aweme/iteminfo/?item_ids=' + video_id,
                                    headers=headers)
            video_url = jsonpath(respone.json(), '$.item_list.video.play_addr.url_list').replace('playwm',
                                                                                                         'play')
            video_content = requests.get(video_url, headers=headers).content
            with open(video_id + '.mp4', 'wb') as data:
               data.write(video_content)
               print('下载成功')
            del (self.down_url)

def main(self):
   with ThreadPoolExecutor(max_workers=2) as t:
         t.submit(self.get_downurl)
         t.submit(self.down_video)

if __name__ == '__main__':
DouyinDown().main()
```
### TODO
如果需要的人多的话，后期考虑更新。
目前我发现可以优化的点有:
1.过滤广告
2.监测某一个用户
3.根据颜值，性别等选择是否下载(已完成)
### 更新
已加入颜值检查，用的是百度智能云的人脸检测接口，目前设置是，性别女，年龄30以下，颜值60分以上

suyaming 发表于 2021-10-8 04:12

网页版
import base64
import time
import requests
from selenium.common import exceptions
from jsonpath import jsonpath
from selenium import webdriver

def check_beauty():
api_key = ''
secret_key = ''
url = 'https://aip.baidubce.com/oauth/2.0/token?grant_type=client_credentials&client_id=' + api_key + '&client_secret=' + secret_key
get_acces_token = requests.get(url).json()
acces_token = jsonpath(get_acces_token, '$..access_token')
with open('screenshot.png', 'rb') as f:
   base64_data = base64.b64encode(f.read())
request_url = "https://aip.baidubce.com/rest/2.0/face/v3/detect"
post_data = {
   "image": base64_data,
   "image_type": "BASE64",
   "face_field": "gender,age,beauty,gender",
   "face_type": "LIVE"
}
headers = {
   "Content-Type": "application/json;"
}
age, beauty, gender = 0, 0, 'male'
try:
   request_url = request_url + "?access_token=" + acces_token
   response = requests.post(url=request_url, data=post_data, headers=headers)
   json_result = response.json()
   error_msg = jsonpath(json_result, '$..error_msg')
   if error_msg == 'SUCCESS':
         age = jsonpath(json_result, '$..age')
         beauty = jsonpath(json_result, '$..beauty')
         gender = jsonpath(json_result, '$..type')
   else:
         print('未识别到人脸')
         return False
   if int(age) <= 30 and int(beauty) >= 60 and gender == 'female':
         return True
   else:
         return False
except:
   pass

class DouyinDown:
def __init__(self):
   options = webdriver.ChromeOptions()
   self.webdriver = webdriver.Chrome(options=options)
   self.down_url = ''
   self.url_title = ''

def get_downurl_web(self):

   driver = self.webdriver
   driver.implicitly_wait(10)
   driver.get('https://www.douyin.com/recommend')
   input('请手动登录继续，完成后输入任意键')
   while True:
         time.sleep(4)
         driver.find_element_by_xpath(
            '//*[@id="root"]/div/div/div/div/div/div/div').screenshot(
            'screenshot.png')
         state_code = check_beauty()
         try:
            if state_code is True:
               driver.find_element_by_xpath('//*[@id="root"]//div/div/div/div/div').click()
               url = driver.find_element_by_xpath('//*[@id="root"]//video').get_attribute('src')
               url_name_elenment = driver.find_elements_by_xpath('//*[@id="root"]//span/span/span/span/span')
               url_name_group = []
               for i in url_name_elenment:
                     url_name_group.append(i.text)
               url_name = '_'.join(url_name_group)
               print('下载中...')
               self.down_url = url
               self.url_title = url_name
               self.down_video_web()
            elif state_code is False:
               print('跳过')
               pass
            driver.find_element_by_xpath('//*[@id="root"]//xg-bar/div/div/div/div').click()
         except exceptions.StaleElementReferenceException:
            print('元素被刷新,下一个')
            driver.find_element_by_xpath('//*[@id="root"]//xg-bar/div/div/div/div').click()
         except Exception as msg:
            print(msg)
            print('异常')
            input('请完成验证码后继续')

def down_video_web(self):
   headers = {
         'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/92.0.4515.107 Safari/537.36'
   }
   video_url = self.down_url
   viede_name = self.url_title
   video_content = requests.get(video_url, headers=headers).content
   with open(viede_name + '.mp4', 'wb') as data:
         data.write(video_content)
         print('下载成功')

if __name__ == '__main__':
DouyinDown().get_downurl_web()

kyx120 发表于 2021-10-7 17:47

这么牛B!,试一下。

kyx120 发表于 2021-10-7 17:50

我就想知道。怎么判断颜值

suyaming 发表于 2021-10-7 17:53

kyx120 发表于 2021-10-7 17:50
我就想知道。怎么判断颜值

人脸识别API

打酱油嘀兔子 发表于 2021-10-7 17:54

这么牛B!,试一下!!!!!

a2581069 发表于 2021-10-7 18:18

浪费电了。。。是收益考虑的还是

小木曾雪菜 发表于 2021-10-7 20:12

有没有办法用pc网页版登陆抖音下载？

suyaming 发表于 2021-10-7 21:05

小木曾雪菜发表于 2021-10-7 20:12
有没有办法用pc网页版登陆抖音下载？

有道理啊，我试试

evill 发表于 2021-10-7 22:07

kyx120 发表于 2021-10-7 17:50
我就想知道。怎么判断颜值

仔细看代码：
https://aip.baidubce.com/rest/2.0/face/v3/detect

页: [1] 2 3

吾爱破解 - 52pojie.cn's Archiver

利用uiautomator2加模拟器自动刷抖音下载无水印视频