106 行
2.5 KiB
Python
106 行
2.5 KiB
Python
"""
|
|
ニコニコのニジカ動画取得モヂュール
|
|
"""
|
|
|
|
from typing import TypedDict, cast
|
|
|
|
import requests
|
|
from bs4 import BeautifulSoup
|
|
from requests.exceptions import Timeout
|
|
|
|
KIRIBAN_VIEWS_COUNTS = { *range (100, 1_000, 100),
|
|
*range (1_000, 10_000, 1_000),
|
|
*range (10_000, 1_000_001, 10_000),
|
|
194, 245, 510, 114_514, 1_940, 2_450, 5_100, 24_500,
|
|
51_000, 2_424 }
|
|
|
|
|
|
class VideoInfo (TypedDict):
|
|
contentId: str
|
|
title: str
|
|
tags: list[str]
|
|
description: str
|
|
|
|
|
|
def get_latest_deerjika (
|
|
) -> VideoInfo | None:
|
|
tag = '伊地知ニジカ OR ぼざろクリーチャーシリーズ'
|
|
url = f"https://www.nicovideo.jp/tag/{ tag }"
|
|
|
|
params = { 'sort': 'f',
|
|
'order': 'd' }
|
|
|
|
video_info = { }
|
|
|
|
bs = get_bs_from_url (url, params)
|
|
if bs is None:
|
|
return None
|
|
|
|
try:
|
|
video = (bs.find_all ('ul', class_ = 'videoListInner')[1]
|
|
.find ('li', class_ = 'item'))
|
|
|
|
video_info['contentId'] = video['data-video-id']
|
|
except Exception:
|
|
return None
|
|
|
|
bs = get_bs_from_url ('https://www.nicovideo.jp/watch/'
|
|
+ video_info['contentId'])
|
|
if bs is None:
|
|
return None
|
|
|
|
try:
|
|
title = bs.find ('title')
|
|
if title is None:
|
|
return None
|
|
video_info['title'] = '-'.join (title.text.split ('-')[:(-1)])[:(-1)]
|
|
|
|
tags: str = bs.find ('meta', attrs = { 'name': 'keywords' }).get ('content') # type: ignore
|
|
video_info['tags'] = tags.split (',')
|
|
|
|
video_info['description'] = bs.find ('meta', attrs = { 'name': 'description' }).get ('content') # type: ignore
|
|
except Exception:
|
|
return None
|
|
|
|
return cast (VideoInfo, video_info)
|
|
|
|
|
|
def get_bs_from_url (
|
|
url: str,
|
|
params: dict = { },
|
|
) -> BeautifulSoup | None:
|
|
"""
|
|
URL から BeautifulSoup インスタンス生成
|
|
|
|
Parameters
|
|
----------
|
|
url: str
|
|
捜査する URL
|
|
params: dict
|
|
パラメータ
|
|
|
|
Return
|
|
------
|
|
BeautifulSoup | None
|
|
BeautifulSoup オブゼクト(失敗したら None)
|
|
"""
|
|
|
|
try:
|
|
req = requests.get (url, params = params, timeout = 60)
|
|
except Timeout:
|
|
return None
|
|
|
|
if req.status_code != 200:
|
|
return None
|
|
|
|
req.encoding = req.apparent_encoding
|
|
|
|
return BeautifulSoup (req.text, 'html.parser')
|
|
|
|
|
|
def get_kiriban_list (
|
|
) -> list[tuple[int, VideoInfo]]:
|
|
kiriban_list: list[tuple[int, VideoInfo]] = []
|
|
|
|
|