anki-word-query/addons/fastwq/service/dict/baidu_chinese.py

104 lines
3.2 KiB
Python
Raw Normal View History

2018-07-07 22:51:01 +08:00
#-*- coding:utf-8 -*-
2018-07-30 17:42:14 +08:00
import os
from ..base import *
2018-07-07 22:51:01 +08:00
baidu_download_mp3 = True
2018-07-14 01:18:03 +08:00
@register([u'百度汉语', u'Baidu-Hanyu'])
2018-07-07 22:51:01 +08:00
class Baidu_Chinese(WebService):
def __init__(self):
super(Baidu_Chinese, self).__init__()
def _get_content(self):
2018-07-30 17:42:14 +08:00
url = u"http://dict.baidu.com/s?wd={}#basicmean".format(self.quote_word)
2018-07-07 22:51:01 +08:00
html = self.get_response(url, timeout=10)
2018-07-13 22:08:35 +08:00
soup = parse_html(html)
2018-07-07 22:51:01 +08:00
result = {
'pinyin': '',
'basicmean': '',
'detailmean': '',
2018-07-07 22:51:01 +08:00
'fanyi': '',
'audio_url': '',
}
#拼音
element = soup.find('div', id='pinyin')
if element:
tag = element.find_all('b')
if tag:
result['pinyin'] = u' '.join(x.get_text() for x in tag)
if tag:
tag = element.find('a')
if tag:
result['audio_url'] = tag.get('url')
2018-07-07 22:51:01 +08:00
#基本释义
element = soup.find('div', id='basicmean-wrapper')
if element:
2018-07-08 17:39:21 +08:00
tag = element.find_all('div', {'class': 'tab-content'})
2018-07-07 22:51:01 +08:00
if tag:
2018-07-26 20:28:46 +08:00
result['basicmean'] = u''.join(str(x).decode('utf-8') for x in tag)
#详细释义
element = soup.find('div', id='detailmean-wrapper')
if element:
2018-07-08 17:39:21 +08:00
tag = element.find_all('div', {'class': 'tab-content'})
if tag:
2018-07-26 20:28:46 +08:00
result['detailmean'] = u''.join(str(x).decode('utf-8') for x in tag)
2018-07-07 22:51:01 +08:00
#英文翻译
element = soup.find('div', id='fanyi-wrapper')
if element:
tag = element.find_all('dt')
if tag:
result['fanyi'] = u'<br>'.join(x.get_text().strip() for x in tag)
return self.cache_this(result)
def _get_field(self, key, default=u''):
return self.cache_result(key) if self.cached(key) else self._get_content().get(key, default)
2018-07-08 17:39:21 +08:00
@with_styles(need_wrap_css=True, cssfile='_baidu.css')
def _css(self, val):
return val
2018-07-13 22:08:35 +08:00
@export([u'拼音', u'Phoneticize'])
2018-07-07 22:51:01 +08:00
def fld_pinyin(self):
return self._get_field('pinyin')
2018-07-13 22:08:35 +08:00
@export('PRON')
2018-07-07 22:51:01 +08:00
def fld_pron(self):
audio_url = self._get_field('audio_url')
if baidu_download_mp3 and audio_url:
filename = u'_baidu_chinese_{}_.mp3'.format(self.word)
2018-07-30 17:42:14 +08:00
filename = get_hex_name(self.unique.lower(), filename, 'mp3')
2018-07-07 22:51:01 +08:00
try:
2018-07-30 17:42:14 +08:00
if os.path.exists(filename) or self.net_download(
2018-07-07 22:51:01 +08:00
filename,
audio_url,
2018-07-30 17:42:14 +08:00
require=dict(mime='audio/mp3', size=512)
):
return self.get_anki_label(filename, 'audio')
2018-07-07 22:51:01 +08:00
except:
pass
return ''
2018-07-13 22:08:35 +08:00
@export([u'基本释义', u'Basic Definitions'])
2018-07-07 22:51:01 +08:00
def fld_basic(self):
2018-07-08 17:39:21 +08:00
val = self._get_field('basicmean')
if val is None or val == '':
return ''
return self._css(val)
2018-07-07 22:51:01 +08:00
2018-07-13 22:08:35 +08:00
@export([u'详细释义', u'Detail Definitions'])
def fld_detail(self):
2018-07-08 17:39:21 +08:00
val = self._get_field('detailmean')
if val is None or val == '':
return ''
return self._css(val)
2018-07-13 22:08:35 +08:00
@export([u'英文翻译', u'Translation[En]'])
2018-07-07 22:51:01 +08:00
def fld_fanyi(self):
return self._get_field('fanyi')