练习一下新的logging和requests包的post办法。
https://github.com/cnbeining/srt2bilibili
需要的依赖较多,安装愉快。
代码下面。
如果ASS:https://pypi.python.org/pypi/asstosrt/0.1.3 然后走起。
#!/usr/bin/env python #coding:utf-8 # Author: Beining --<ACICFG> # Purpose: A batch poster of srt file to danmaku on Bilibili. # Created: 11/23/2014 # srt2Bilibili is licensed under GNUv2 license ''' srt2Bilibili 0.0.1 Beining@ACICFG cnbeining[at]gmail.com http://www.cnbeining.com https://github.com/cnbeining/srt2bilibili GNUv2 license ''' import sys import os import random import requests import urllib import pysrt import logging import hashlib import time as time_old import getopt from xml.dom.minidom import parse, parseString import xml.dom.minidom global FAKE_HEADER, APPKEY, SECRETKEY, VER, rnd, cid FAKE_HEADER = { 'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_9_0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/31.0.1650.63 Safari/537.36', 'Cache-Control': 'no-cache', 'Pragma': 'no-cache'} APPKEY = '85eb6835b0a1034e' SECRETKEY = '2ad42749773c441109bdc0191257a664' VER = '0.01' #---------------------------------------------------------------------- def calc_sign(string): """str/any->str return MD5. From: Biligrab, https://github.com/cnbeining/Biligrab MIT License""" return str(hashlib.md5(str(string).encode('utf-8')).hexdigest()) #---------------------------------------------------------------------- def find_cid_api(vid, p): """find cid and print video detail str,int?,str->str TODO: Use json. From: Biligrab, https://github.com/cnbeining/Biligrab MIT License""" cid = 0 if str(p) is '0' or str(p) is '1': str2Hash = 'appkey={APPKEY}&id={vid}&type=xml{SECRETKEY}'.format(APPKEY = APPKEY, vid = vid, SECRETKEY = SECRETKEY) biliurl = 'https://api.bilibili.com/view?appkey={APPKEY}&id={vid}&type=xml&sign={sign}'.format(APPKEY = APPKEY, vid = vid, SECRETKEY = SECRETKEY, sign = calc_sign(str2Hash)) else: str2Hash = 'appkey={APPKEY}&id={vid}&page={p}&type=xml{SECRETKEY}'.format(APPKEY = APPKEY, vid = vid, p = p, SECRETKEY = SECRETKEY) biliurl = 'https://api.bilibili.com/view?appkey={APPKEY}&id={vid}&page={p}&type=xml&sign={sign}'.format(APPKEY = APPKEY, vid = vid, SECRETKEY = SECRETKEY, p = p, sign = calc_sign(str2Hash)) logging.debug(biliurl) logging.info('Fetching webpage...') try: request = urllib.request.Request(biliurl, headers=BILIGRAB_HEADER) response = urllib.request.urlopen(request) data = response.read() dom = parseString(data) for node in dom.getElementsByTagName('cid'): if node.parentNode.tagName == "info": cid = node.toxml()[5:-6] logging.info('cid is ' + cid) break return cid except: # If API failed logging.warning('Cannot connect to API server! \nIf you think this is wrong, please open an issue at \nhttps://github.com/cnbeining/Biligrab/issues with *ALL* the screen output, \nas well as your IP address and basic system info.') return 0 #---------------------------------------------------------------------- def convert_cookie(cookie_raw): """str->dict 'DedeUserID=358422; DedeUserID__ckMd5=72682a6838d150dd; SESSDATA=72e0ee97%2C1419212650%2C6b47a180' cookie = {'DedeUserID': 358422, 'DedeUserID__ckMd5': '72682a6838d150dd', 'SESSDATA': '72e0ee97%2C1419212650%2C6b47a180'}""" cookie = {} logging.debug('Raw Cookie: ' + cookie_raw) for i in [i.strip() for i in cookie_raw.split(';')]: cookie[i.split('=')[0]] = i.split('=')[1] return cookie #---------------------------------------------------------------------- def getdate(): """None->str 2014-11-23 10:39:46""" return time_old.strftime("%Y-%m-%d %X", time_old.localtime()) #---------------------------------------------------------------------- def post_one(message, rnd, cid, cookie, fontsize = 25, mode = 1, color = 16777215, playTime = 0, pool = 0): """ PARS NOT THE PERFECT SAME AS A PAYLOAD!""" headers = {'Origin': 'http://static.hdslb.com', 'X-Requested-With': 'ShockwaveFlash/15.0.0.223', 'Referer': 'http://static.hdslb.com/play.swf', 'User-Agent': BILIGRAB_UA, 'Host': 'interface.bilibili.com', 'Content-Type': 'application/x-www-form-urlencoded', 'Cookie': cookie} url = 'http://interface.bilibili.com/dmpost' try: date = getdate() payload = {'fontsize': int(fontsize), 'message': str(message), 'mode': int(mode), 'pool': pool, 'color': int(color), 'date': str(date), 'rnd': int(rnd), 'playTime': playTime, 'cid': int(cid)} encoded_args = urllib.parse.urlencode(payload) r = requests.post(url, data = encoded_args, headers = headers) #print(r.text) if int(r.text) <= 0: logging.warning('Line failed:') logging.warning('Message:' + str(message)) else: print(message) #logging.info(message) except Exception as e: print('ERROR: Line failed: %s' % e) print('Payload:' + str(payload)) pass #---------------------------------------------------------------------- def timestamp2sec(timestamp): """""" return (int(timestamp.seconds) + 60 * int(timestamp.minutes) + 3600 * int(timestamp.hours) + float(int(timestamp.hours) / 1000)) #---------------------------------------------------------------------- def read_cookie(cookiepath): """str->list Original target: set the cookie Target now: Set the global header From: Biligrab, https://github.com/cnbeining/Biligrab MIT License""" global BILIGRAB_HEADER try: cookies_file = open(cookiepath, 'r') cookies = cookies_file.readlines() cookies_file.close() # print(cookies) return cookies except: print('WARNING: Cannot read cookie, may affect some videos...') return [''] #---------------------------------------------------------------------- def main(srt, fontsize, mode, color, cookie, aid, p = 1, cool = 2, pool = 0): """str,int,int,int,str,int,int,int,int->None""" rnd = int(random.random() * 1000000000) cid = int(find_cid_api(aid, p)) subs = pysrt.open(srt) for sub in subs: #lasttime = timestamp2sec(sub.stop) - timestamp2sec(sub.start) # For future use playtime = timestamp2sec(sub.start) message = sub.text if '\n' in message: for line in message.split('\n'): post_one(line, rnd, cid, cookie, fontsize, mode, color, playtime, pool) else: post_one(message, rnd, cid, cookie, fontsize, mode, color, playtime, pool) time_old.sleep(int(cool)) print('INFO: DONE!') #---------------------------------------------------------------------- def usage(): """""" print(''' srt2Bilibili https://github.com/cnbeining/srt2bilibili http://www.cnbeining.com/ Beining@ACICFG WARNING: THIS PROGRAMME CAN BE DANGEROUS IF MISUSED, AND CAN LEAD TO UNWANTED CONSEQUNCES, INCLUDING (BUT NOT LIMITED TO) TEMPORARY OR PERMANENT BAN OF ACCOUNT AND/OR IP ADDRESS, DANMAKU POOL OVERSIZE, RUIN OF NORMAL DANMAKU. ONLY USE IF YOU KNOW WHAT YOU ARE DOING. This program is provided **as is**, with absolutely no warranty. Usage: python3 srt2bilibili.py (-h) (-a 12345678) [-p 1] [-c ./bilicookies] (-s 1.srt) [-f 25] [-m 0] [-o 16777215] [-w 2] [-l 0] -h: Default: None Print this usage file. -a: Default: None The av number. -p: Default: 1 The part number. -c Default: ./bilicookies The path of cookies. Should looks like: DedeUserID=123456;DedeUserID__ckMd5=****************;SESSDATA=******************* -s Default: None The srt file you want to post. srt2bilibili will post multi danmakues for multi-line subtitle, since there's a ban on the use of \n. -f Default: 25 The size of danmaku. -m Default: 4 The mode of danmaku. 1: Normal 4: Lower Bound *Suggested 5: Upper Bound 6: Reverse 7: Special 9: Advanced -o Default: 16777215 The colour of danmaku, in integer. -w Default: 2 The cool time (time to wait between posting danmakues) Do not set it too small, which would lead to ban or failure. -l Default: 0 The Danmaku Pool to use. 0: Normal 1: Subtitle 2: Special If you own the video, please set it to 1 to prevent potential lost of danmaku. More info avalable at http://docs.bilibili.cn/wiki/API.comment . ''') if __name__=='__main__': argv_list = [] argv_list = sys.argv[1:] aid, part, cookiepath, srt, fontsize, mode, color, cooltime, playtime, pool = 0, 1, './bilicookies', '', 25, 4, 16777215, 2, 0, 0 try: opts, args = getopt.getopt(argv_list, "ha:p:c:s:f:m:o:l:", ['help', "av", 'part', 'cookie', 'srt', 'fontsize', 'mode', 'color', 'cooltime', 'pool']) except getopt.GetoptError: usage() exit() for o, a in opts: if o in ('-h', '--help'): usage() exit() if o in ('-a', '--av'): aid = a try: argv_list.remove('-a') except: break if o in ('-p', '--part'): part = a try: argv_list.remove('-p') except: part = 1 break if o in ('-c', '--cookie'): cookiepath = a try: argv_list.remove('-c') except: print('INFO: No cookie path set, use default: ./bilicookies') cookiepath = './bilicookies' break if o in ('-s', '--srt'): srt = a try: argv_list.remove('-s') except: break if o in ('-f', '--fontsize'): fontsize = a try: argv_list.remove('-f') except: break if o in ('-m', '--mode'): mode = a try: argv_list.remove('-m') except: mode = 1 break if o in ('-o', '--color'): color = a try: argv_list.remove('-o') except: color = 16777215 break if o in ('-w', '--cooltime'): cooltime = a try: argv_list.remove('-w') except: cooltime = 2 break if o in ('-l', '--pool'): pool = a try: argv_list.remove('-l') except: pool = 0 break if aid == 0: logging.fatal('No aid!') exit() if srt == '': logging.fatal('No srt!') exit() if len(cookiepath) == 0: cookiepath = './bilicookies' cookies = read_cookie(cookiepath) logging.debug('Cookies: ' + cookiepath) BILIGRAB_UA = 'srt2Bilibili / ' + str(VER) + ' (cnbeining@gmail.com)' BILIGRAB_HEADER = {'User-Agent': BILIGRAB_UA, 'Cache-Control': 'no-cache', 'Pragma': 'no-cache', 'Cookie': cookies[0]} logging.debug(cookies[0]) main(srt, fontsize, mode, color, cookies[0], aid, part, cooltime, pool)
126 行那神奇的六个引号是干什么的……没有 docstring 写也要凑一个空的么?
23333333333333333333333333
话说射手字幕站关了你有什么感想?
为什么不让冷却时间随机化呢?
好像B站官方播放器冷却时间是3秒?我们设置成 2~5 秒之间随机怎样?
还有,time_old.sleep 可以填小数。没必要转换成整数。
我的编辑器在定义函数的时候自动出
#———————————————————————-
def ():
“”””””
所以就留下了。
我们的言论审查已经回到了延安时期。当然我是不鸟的:开历史倒车没有好下场。该继续继续。
冷却随机化是可以的,但是,一个600行的双行字幕,就需要1个小时才能发完。这赶上压制一遍的速度了。
我测试0.1秒就够。当然死了不负责。。。
time这个我没想到命名被override了。。。所以写了old。之前的整数是怕速度太快,已经把修改的新版push了。
射手网不是不储存视频吗,基本谈不上版权和审查吧……我是闹不太清楚啦
话说回来有字幕备份在手恢复也不难,而且http://shooter.cn/sub/upload.html还在
恢复快有了。
但是玩文化审查?这不是40年代了。没什么可以被审查了。
开历史倒车没什么好下场。
啊哈,本来想写个js的,用来传ass到字幕池,
唔~~~现在看来没有必要了~~~
PS正在考虑做一个弹幕池项目,(缓慢爬行中)
视频在本地,服务器只储存弹幕,以磁链为弹幕池索引
求感兴趣的来斧正:https://github.com/OpenDanmaku/OpenDanmaku
ass?that s another story。
ASS涉及到字体,所以必须要高级弹幕。我是写不出这种翻译器了,所以就得这样了:统统srt的干活吧。
这个项目很有意思。。。去中心化就更有意思了。那就是真正的开放弹幕了啊。。。。
那就需要一个与bt或magnet或ed2k绑定的分布式IRC
(或IRC插件,利用这些协议现有的,或者自己设计的单独的聊天信道),
客户端监听每个anonymous user发布弹幕时的广播,
互相传递本地弹幕cache,并用guid来去除重复
而且仍然可以实现云屏蔽(用户对某条弹幕/某人标记dislike),
跨弹幕池引用(针对不同字幕组/合集,当然要做时间轴调整)等等
Good idea……不过我没有这个本事实现它……lol,
事实上身为web初心,做现在这个项目也很困难,真希望有更合适的人来做啊……
从好处想,这是一个去中心化的对特定区域广播机制。可以做什么你懂的。
当然我就是这么一说。。。而且得不到北美和欧洲开源界的支持 不好办啊。。。
先看看非去中心的这个磁链弹幕库能不能吸引人气吧…
git更新了一点…夜半写代码好累…
带弱中心的去中心化弹幕库?好主意。。。
拿这个点子去找大站吧。
服务端大致写了一点,(虽然很不像话但是尽力了),求提意见,求斧正
https://github.com/OpenDanmaku/OpenDanmaku
咱是渣渣,不敢多言。。。
总之尽可能帮忙吧。
ASS可以先用https://pypi.python.org/pypi/asstosrt/0.1.3 转成SRT,然后srt2Bilibili走起。。。