anki-word-query/src/fastwq/service/dict/yahoo.py

87 lines
2.7 KiB
Python
Raw Normal View History

2018-07-26 19:45:39 +08:00
# -*- coding:utf-8 -*-
import os
from hashlib import sha1
from ..base import WebService, export, register, with_styles, parse_html
yahoo_download_mp3 = True
@register([u'雅虎奇摩字典', u'Yahoo-Dict'])
class Yahoo_Dict(WebService):
def __init__(self):
super(Yahoo_Dict, self).__init__()
def _get_content(self):
url = u"https://tw.dictionary.search.yahoo.com/search?p={}".format(
self.word)
html = self.get_response(url, timeout=10)
soup = parse_html(html)
result = {
'phon': '',
'def': '',
'audio_url': '',
}
# 基本
element = soup.find(
'div', class_='dd cardDesign dictionaryWordCard sys_dict_word_card')
if element:
# 音标
tag = element.find('div', class_='compList ml-25 d-ib')
if tag:
result['phon'] = tag.get_text()
# 发音
result['audio_url'] = u'https://s.yimg.com/bg/dict/dreye/live/f/{}.mp3'.format(
self.word)
# 词性及中文解释
tag = element.find('div', class_='compList mb-25 ml-25 p-rel')
if tag:
result['def'] = u'<div class="dd cardDesign">' + \
str(tag.find('ul')).decode('utf-8') + u'</div>'
return self.cache_this(result)
def _get_field(self, key, default=u''):
return self.cache_result(key) if self.cached(key) else self._get_content().get(key, default)
@with_styles(need_wrap_css=True, cssfile='_yahoo.css')
def _css(self, val):
return val
@export(u'音标')
def fld_pinyin(self):
return self._get_field('phon')
@export(u'发音')
def fld_pron(self):
audio_url = self._get_field('audio_url')
if yahoo_download_mp3 and audio_url:
filename = u'_yahoo_dict_{}_.mp3'.format(self.word)
hex_digest = sha1(
self.word.encode('utf-8') if isinstance(self.word, unicode)
else self.word
).hexdigest().lower()
assert len(hex_digest) == 40, "unexpected output from hash library"
filename = '.'.join([
'-'.join([
self.unique.lower(
), hex_digest[:8], hex_digest[8:16],
hex_digest[16:24], hex_digest[24:32], hex_digest[32:],
]),
'mp3',
])
if os.path.exists(filename) or self.download(audio_url, filename, 5):
return self.get_anki_label(filename, 'audio')
return ''
@export(u'中文释义')
def fld_basic(self):
val = self._get_field('def')
if val is None or val == '':
return ''
return self._css(val)