python bilibili 批量下载-GUI

bilibili_video_download-GUI page.py.txt
requirements.txt
Version: Python3
安装依赖库
pip3 install -r requirements.txt
带用户界面,可批量,可下用户所有视频

# !/usr/bin/python
# -*- coding:utf-8 -*-
# time: 2019/07/02--08:12
__author__ = 'Henry'


'''
项目: B站视频下载 - GUI版本
版本1: 加密API版,不需要加入cookie,直接即可下载1080p视频
20190422 - 增加多P视频单独下载其中一集的功能
20190702 - 增加视频多线程下载 速度大幅提升
20190711 - 增加GUI版本,可视化界面,操作更加友好
'''

import requests, time, hashlib, urllib.request, re, json,random
import imageio
imageio.plugins.ffmpeg.download()
# 如果下载ffmpeg.win32.exe超时,手动下载ffmpeg.win32.exe并放到C:\Users\Administrator\AppData\Local\imageio\ffmpeg\下
from moviepy.editor import *
import os, sys, threading



from tkinter import *
from tkinter import ttk
from tkinter import StringVar
root=Tk()
start_time = time.time()

# Redirect print-style output into the GUI message box
def print(theText):
    """Append ``theText`` plus a newline to the end of the ``msgbox`` widget.

    This definition shadows the builtin ``print`` for the rest of the
    module, so every ``print(...)`` call below writes to the GUI instead of
    the console.

    Args:
        theText: Value to display. It is converted with ``str()`` first, so
            numbers, exceptions and other non-string objects are accepted
            instead of raising ``TypeError`` on concatenation.
    """
    msgbox.insert(END, str(theText) + '\n')


# Query the play-URL API
def get_play_list(start_url, cid, quality):
    """Return the media URLs listed under ``durl`` in the play-URL response.

    Args:
        start_url: Sent as the ``Referer`` header of the API request.
        cid: Content id, placed in the ``cid`` query parameter.
        quality: Quality code, placed in both ``qn`` and ``quality``.

    Returns:
        A list with the ``url`` field of every entry in the response's
        ``durl`` array, in response order.
    """
    entropy = 'rbMCKn@KuamXWlPMoJGsKcbiJKUfkPF_8dABscJntvqhRSETg'
    # The key pair is stored obfuscated: walk the string backwards, shift
    # every character up by two code points, then split on ':'.
    decoded = ''.join(chr(ord(ch) + 2) for ch in reversed(entropy))
    appkey, sec = decoded.split(':')
    params = 'appkey=%s&cid=%s&otype=json&qn=%s&quality=%s&type=' % (appkey, cid, quality, quality)
    # The signature is the MD5 hex digest of the query string followed by the secret.
    digest = hashlib.md5((params + sec).encode('utf8'))
    chksum = digest.hexdigest()
    url_api = 'https://interface.bilibili.com/v2/playurl?%s&sign=%s' % (params, chksum)
    headers = {
        'Referer': start_url,  # the Referer header must be supplied
        'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36'
    }
    response = requests.get(url_api, headers=headers)
    payload = response.json()
    return [segment['url'] for segment in payload['durl']]


# 下载视频
'''
 urllib.urlretrieve 的回调函数:
def callbackfunc(blocknum, blocksize, totalsize):
    @blocknum:  已经下载的数据块
    @blocksize: 数据块的大小
    @totalsize: 远程文件的大小
'''


def Schedule_cmd(blocknum, blocksize, totalsize):
    """``urlretrieve`` report hook that updates the GUI progress bar.

    Args:
        blocknum: Number of blocks transferred so far.
        blocksize: Size of one block in bytes.
        totalsize: Total size of the remote file in bytes. A value that is
            zero or negative (size unknown) is shown as 0% rather than
            dividing by it.

    The completed fraction is clamped to 1.0 because ``blocknum * blocksize``
    can exceed ``totalsize`` on the final block, which would otherwise draw
    the bar past the 465-pixel canvas and report more than 100%.
    """
    recv_size = blocknum * blocksize

    # Fraction completed, kept inside [0, 1]
    if totalsize > 0:
        pervent = min(recv_size / totalsize, 1.0)
    else:
        pervent = 0.0
    percent_str = "%.2f%%" % (pervent * 100)
    download.coords(fill_line1,(0,0,pervent*465,23))
    root.update()
    pct.set(percent_str)



def Schedule(blocknum, blocksize, totalsize):
    """Text-mode report hook: print the percentage done and the average speed.

    Args:
        blocknum: Number of blocks transferred so far.
        blocksize: Size of one block in bytes.
        totalsize: Total size of the remote file in bytes. A value that is
            zero or negative (size unknown) is reported as 0%.

    The speed is the number of bytes received divided by the seconds elapsed
    since the module-level ``start_time``; a non-positive elapsed time is
    reported as a speed of 0 instead of dividing by it.
    """
    recv_size = blocknum * blocksize
    elapsed = time.time() - start_time
    speed = recv_size / elapsed if elapsed > 0 else 0
    speed_str = " Speed: %s" % format_size(speed)

    # Fraction completed, kept inside [0, 1]
    if totalsize > 0:
        pervent = min(recv_size / totalsize, 1.0)
    else:
        pervent = 0.0
    percent_str = "%.2f%%" % (pervent * 100)
    print(percent_str.ljust(6, ' ') + '-' + speed_str)
    sys.stdout.flush()
    # NOTE(review): this pause limits how often a line is printed, but it
    # also delays whoever invokes the hook by two seconds per call - confirm
    # that is acceptable before wiring this hook into a download.
    time.sleep(2)
    # print('\r')


# Convert a byte count into a K / M / G string
def format_size(bytes):
    """Format a byte count as kibibytes, mebibytes or gibibytes.

    Args:
        bytes: Anything ``float()`` accepts (int, float, numeric string).

    Returns:
        The size with three decimals and a ``K``, ``M`` or ``G`` suffix,
        picking the largest unit whose value is at least 1 (``K`` is the
        smallest unit used). Returns the string ``"Error"`` after printing a
        message when the argument cannot be converted to a float.
    """
    try:
        size = float(bytes)
    except (TypeError, ValueError, OverflowError):
        # Only conversion failures are handled here; anything else
        # (e.g. KeyboardInterrupt) is allowed to propagate.
        print("传入的字节格式不对")
        return "Error"
    kb = size / 1024
    if kb >= 1024:
        mb = kb / 1024
        if mb >= 1024:
            return "%.3fG" % (mb / 1024)
        return "%.3fM" % (mb)
    return "%.3fK" % (kb)


# Download the segments of one video
def down_video(video_list, title, start_url, page):
    """Download every URL in ``video_list`` into ``bilibili_video/<title>``.

    Args:
        video_list: Segment URLs to fetch, in order.
        title: Used both as the sub-directory name and as the file name stem.
        start_url: Sent as the ``Referer`` header of each download request.
        page: Part number, only used in the progress message.

    When there is more than one segment the files are named
    ``<title>-<n>.flv`` with ``n`` starting at 1; a single segment is saved
    as ``<title>.flv``. Progress is reported through ``Schedule_cmd``.
    """
    print('[正在下载P{}段视频,请稍等...]:'.format(page) + title+sys.path[0])
    # Downloads go under the first sys.path entry
    currentVideoPath = os.path.join(sys.path[0], 'bilibili_video',title)
    if not video_list:
        # Nothing to fetch: leave the opener and the file system untouched.
        return

    # The request headers are the same for every segment, so the opener is
    # built and installed once instead of once per segment.
    # NOTE: install_opener() replaces the process-wide default opener.
    opener = urllib.request.build_opener()
    opener.addheaders = [
        # ('Host', 'upos-hz-mirrorks3.acgvideo.com'),  # optional host override
        ('User-Agent', 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10.13; rv:56.0) Gecko/20100101 Firefox/56.0'),
        ('Accept', '*/*'),
        ('Accept-Language', 'en-US,en;q=0.5'),
        ('Accept-Encoding', 'gzip, deflate, br'),
        ('Range', 'bytes=0-'),  # request the file from byte 0 to get the complete video
        ('Referer', start_url),  # the Referer header must be supplied
        ('Origin', 'https://www.bilibili.com'),
        ('Connection', 'keep-alive'),
    ]
    urllib.request.install_opener(opener)

    # Create the target folder; exist_ok avoids a check-then-create race
    os.makedirs(currentVideoPath, exist_ok=True)

    multi_segment = len(video_list) > 1
    for num, url in enumerate(video_list, start=1):
        if multi_segment:
            file_name = r'{}-{}.flv'.format(title, num)
        else:
            file_name = r'{}.flv'.format(title)
        urllib.request.urlretrieve(url=url, filename=os.path.join(currentVideoPath, file_name), reporthook=Schedule_cmd)

# Merge downloaded segments (20190802 version)
def combine_video(title_list):
    """Concatenate the ``<title>-<n>.flv`` segments of each title into an mp4.

    Args:
        title_list: Titles whose ``bilibili_video/<title>`` directories
            should be processed.

    Only files whose name ends in ``-<digits>.flv`` are treated as segments.
    Other files in the directory (for example an mp4 produced by an earlier
    run) are ignored instead of breaking the numeric sort. A title with
    fewer than two segments is reported as complete without merging, and a
    title whose directory does not exist is reported and skipped.
    """
    video_path = os.path.join(sys.path[0], 'bilibili_video')  # download directory
    segment_pattern = re.compile(r'-(\d+)\.flv$')
    for title in title_list:
        current_video_path = os.path.join(video_path ,title)
        if not os.path.isdir(current_video_path):
            # Nothing was downloaded for this title; keep going with the rest.
            print('[未找到下载目录]:' + title)
            continue

        # Collect (segment number, file name) pairs for real segment files only
        segments = []
        for file_name in os.listdir(current_video_path):
            matched = segment_pattern.search(file_name)
            if matched:
                segments.append((int(matched.group(1)), file_name))

        if len(segments) >= 2:
            # Merging is only needed when there is more than one segment
            print('[下载完成,正在合并视频...]:' + title)
            segments.sort()
            clips = [
                VideoFileClip(os.path.join(current_video_path, file_name))
                for _, file_name in segments
            ]
            final_clip = concatenate_videoclips(clips)
            # Write the merged video next to its segments
            final_clip.to_videofile(os.path.join(current_video_path, r'{}.mp4'.format(title)), fps=24, remove_temp=False)
            print('[视频合并完成]' + title)
        else:
            # A single segment needs no merging
            print('[视频合并完成]:' + title)
        print(os.path.join(video_path ,title))

def _getAvsFromPage(user,pagemount,page):
    """Collect av numbers for ``user``: one page, or every page.

    Args:
        user: User id, as a string.
        pagemount: Page size as a string. When it is blank, all pages are
            fetched 50 entries at a time and ``page`` is ignored.
        page: Page number as a string, used only with a non-blank
            ``pagemount``.

    Returns:
        The list of av numbers (strings) that were found.
    """
    if pagemount.strip():
        print ("down a page:user= "+user +", page size= "+pagemount+", page no.= "+page)
        inputs = __getAvsFromPage(user,pagemount,page)
    else:
        print ("down all av from user= " + user)
        inputs = []
        pg = 1
        # Keep requesting pages until one comes back empty
        while True:
            batch = __getAvsFromPage(user,"50",str(pg))
            if not batch:
                break
            inputs.extend(batch)
            pg += 1
    # Every av number is followed by a comma, including the last one
    tip = "".join(av + "," for av in inputs)
    print (tip+"\n一共找到av个数:"+str(len(inputs)))
    return inputs
            
def __getAvsFromPage(user,pagemount,page):
    """Fetch one page of a user's submitted videos and return their av numbers.

    Args:
        user: User id, placed in the ``mid`` query parameter.
        pagemount: Page size, placed in ``pagesize``.
        page: Page number, placed in ``page``.

    All three arguments must be strings because they are joined into the URL.

    Returns:
        ``str(aid)`` for every entry of ``data.vlist`` in the JSON response.
    """
    # Request with a mobile User-Agent
    headers = {
      "User-Agent": "Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/604.1.38 (KHTML, like Gecko) Version/11.0 Mobile/15A372 Safari/604.1"
    }
    video_url = "".join([
        "https://space.bilibili.com/ajax/member/getSubmitVideos?mid=", user,
        "&pagesize=", pagemount,
        "&tid=0&page=", page,
        "&keyword=&order=pubdate",
    ])
    response = requests.get(url=video_url, headers=headers)
    uservideo = json.loads(response.content.decode('utf-8'))
    return [str(vid['aid']) for vid in uservideo['data']['vlist']]
         
def _getAvNos(inputStart):    
    if inputStart.find(';')>0 : #多个av号  或者多个 av  url
        inputs = inputStart.split(";")
        intype = 2
    elif  inputStart.strip().isdigit() == True or re.search(r'/av(\d+)/*', inputStart.strip())!=None: #single av number
        inputs = [inputStart]
        intype = 1
    elif inputStart.find(',')>0  : #  下载视频“用户,页容量,页号” 格式
        ups = inputStart.strip().split(",")
        inputs=_getAvsFromPage(str(ups[0]),str(ups[1]),str(ups[2]))
        intype = 0
    else:
        inputs=[]
        print("错误的格式")
    return inputs,intype

def do_prepare(inputStart,inputQuality):
    """Download and merge every video named by the user's input.

    Args:
        inputStart: Raw text from the input field; ``_getAvNos`` turns it
            into a list of av numbers / URLs.
        inputQuality: Quality code passed on to ``get_play_list``.

    For each entry the video metadata is fetched, one download thread is
    started per selected part, all threads are joined, the segments are
    merged with ``combine_video`` and the elapsed time is printed. On
    Windows the download folder is opened afterwards.

    The Referer passed on for each part is built from the metadata URL plus
    that part's own ``/?p=<page>``, so the suffixes of earlier parts are not
    carried over. An entry without a parsable av number, or whose metadata
    response has no ``data``, is reported and skipped so that the rest of
    the batch still runs.
    """
    # Reset the progress bar
    download.coords(fill_line1,(0,0,0,23))
    pct.set('0.00%')
    root.update()
    # Clear the message box
    msgbox.delete('1.0','end')
    # Split the input into individual av numbers / URLs
    inputs,intype = _getAvNos(inputStart)
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36'
    }
    for entry in inputs:
        print('*' * 30 + 'B站视频下载小助手' + '*' * 30)
        start = entry.strip()
        if start.isdigit():
            # The entry is a bare av number
            avno = start
        else:
            # e.g. https://www.bilibili.com/video/av46958874/?spm_id_from=...
            print ("deal with "+start)
            matched = re.search(r'/av(\d+)/*', start)
            if matched is None:
                print("错误的格式")
                continue
            avno = matched.group(1)
        # Metadata endpoint; it only needs the aid
        api_url = 'https://api.bilibili.com/x/web-interface/view?aid=' + avno

        # Quality codes: 80 = 1080P, 64 = 720P, 32 = 480P, 16 = 360P
        quality = inputQuality
        # Fetch the cid and title of every part
        html = requests.get(api_url, headers=headers).json()
        data = html.get('data')
        if not data:
            # presumably the API reported an error for this av number
            print('[获取视频信息失败]:' + avno)
            continue
        if '?p=' in start:
            # Download just one part of a multi-part video
            p = re.search(r'\?p=(\d+)',start).group(1)
            cid_list = [data['pages'][int(p) - 1]]
        else:
            # No part selected: download all parts
            cid_list = data['pages']
        if intype == 0 and len(cid_list)>1:
            # For a user listing, multi-part videos are skipped
            cid_list = []

        threadpool = []
        title_list = []
        for item in cid_list:
            cid = str(item['cid'])
            title = re.sub(r'[\/\\:*?"<>|]', '', item['part'])  # drop characters not allowed in file names
            title =title+"avno"+avno
            print('[下载视频的cid]:' + cid)
            print('[下载视频的标题]:' + title)
            title_list.append(title)
            page = str(item['page'])
            # Built from the base URL each time so suffixes do not pile up
            referer = api_url + "/?p=" + page
            video_list = get_play_list(referer, cid, quality)
            th = threading.Thread(target=down_video, args=(video_list, title, referer, page))
            threadpool.append(th)

        # Time the downloads of this entry from the moment the threads start
        started_at = time.time()
        for th in threadpool:
            th.daemon = True
            th.start()
        # Wait for every download to finish
        for th in threadpool:
            th.join()

        # Finally merge the segments
        combine_video(title_list)

        end_time = time.time()
        print('下载总耗时%.2f秒,约%.2f分钟' % (end_time - started_at, int(end_time - started_at) / 60))

        # On Windows, open the download folder when done
        currentVideoPath = os.path.join(sys.path[0], 'bilibili_video')
        if (sys.platform.startswith('win')):
            os.startfile(currentVideoPath)

        time.sleep(5)



def thread_it(func, *args):
    """Run ``func(*args)`` on a new daemon thread and return immediately.

    Args:
        func: Callable to execute in the background.
        *args: Positional arguments forwarded to ``func``.

    The thread is created with ``daemon=True`` (instead of the deprecated
    ``setDaemon`` call) and is not joined, so the caller never waits for
    ``func`` to finish.
    """
    t = threading.Thread(target=func, args=args, daemon=True)
    t.start()


# Script entry point: build the tkinter window, wire the download button to
# do_prepare (run on a background thread via thread_it) and start the event loop.
if __name__ == "__main__":
    # Window title
    root.title('B站视频下载小助手-GUI')
    # Window icon, loaded from a path relative to the working directory
    root.iconbitmap('./Pic/favicon.ico')
    # Logo image shown at the top of the window
    photo = PhotoImage(file='./Pic/logo.png')
    logo = Label(root,image=photo)
    logo.pack()
    # Input fields and selection boxes
    inputStart = Entry(root,bd=4,width=600)
    labelStart=Label(root,text="请输入您要下载的B站av号(多号;分割)或者视频链接地址(多url;分割)或者mid用户号pc页容量pn页码(用,分割)--(用户号,,表示所有该用户视频)") # label for the address input
    labelStart.pack(anchor="w")
    inputStart.pack()
    labelQual = Label(root,text="请选择您要下载视频的清晰度") # label for the quality selector
    labelQual.pack(anchor="w")
    inputQual = ttk.Combobox(root,state="readonly")
    # Choices offered in the drop-down
    inputQual['value']=('1080P','720p','480p','360p')
    # Maps each displayed choice to the quality code handed to do_prepare
    keyTrans=dict()
    keyTrans['1080P']='80'
    keyTrans['720p']='64'
    keyTrans['480p']='32'
    keyTrans['360p']='16'
    # Preselect the first entry of the list above ('1080P')
    inputQual.current(0)
    inputQual.pack()
    # The button reads the current field values at click time and runs
    # do_prepare through thread_it
    confirm = Button(root,text="开始下载",command=lambda:thread_it(do_prepare,inputStart.get(), keyTrans[inputQual.get()] ))
    msgbox = Text(root)
    # Usage help. Every insert targets index '1.0' (the very start of the
    # widget), so the text inserted last ends up displayed first.
    msgbox.insert('1.0',"------------------\n用户名,,\n(eg:  20862117,,) 表示获取用户20862117所有视频\n")
    msgbox.insert('1.0',"------------------\n用户名,每页容量,第几页(页号从1开始)\n(eg:  20862117,100,2) 表示用户20862117,每页100av,获取第2页\n")
    msgbox.insert('1.0',"------------------\n多个av号,用;分割\n(eg:49853211;23995112;9855566)\n多个视频链接地址,用;分割\n(eg:https://www.bilibili.com/video/av49842011;https://www.bilibili.com/video/av48562233)\n")
    msgbox.insert('1.0',"对于单P视频:直接传入B站av号或者视频链接地址\n(eg: 49842011或者https://www.bilibili.com/video/av49842011)\n对于多P视频:\n1.下载全集:直接传入B站av号或者视频链接地址\n(eg: 49842011或者https://www.bilibili.com/video/av49842011)\n2.下载其中一集:传入那一集的视频链接地址\n(eg: https://www.bilibili.com/video/av19516333/?p=2)\n")

    msgbox.pack()
    download=Canvas(root,width=465,height=23,bg="white")
    # Progress bar: a green rectangle on the canvas that starts with zero width
    labelDownload=Label(root,text="下载进度")
    labelDownload.pack(anchor="w")
    download.pack()
    fill_line1 = download.create_rectangle(0, 0, 0, 23, width=0, fill="green")
    # Percentage text displayed under the progress bar
    pct=StringVar()
    pct.set('0.0%')
    pctLabel = Label(root,textvariable=pct)
    pctLabel.pack()
    root.geometry("600x800")
    confirm.pack()
    # Enter the GUI main loop
    root.mainloop()
    
发表新评论
仅有 1 条评论
  1. root
    root本文作者
    回复

    GUI-2.0版 bv号 视频下载 ,修改 av号代码如下:
    start_url = 'https://api.bilibili.com/x/web-interface/view?bvid=BV' + re.search(r'/BV.*?\?', start+"?").group(0)[3:-1]