update
This commit is contained in:
parent
c2cad265cb
commit
dafee9e18d
@ -1,6 +1,5 @@
|
|||||||
"""
|
"""
|
||||||
This code is supported by the website: https://www.guanjihuan.com
|
This code is supported by the website: https://www.guanjihuan.com
|
||||||
The newest version of this code is on the web page: https://www.guanjihuan.com/archives/18038
|
|
||||||
"""
|
"""
|
||||||
|
|
||||||
from bs4 import BeautifulSoup
|
from bs4 import BeautifulSoup
|
@ -0,0 +1,33 @@
|
|||||||
|
"""
|
||||||
|
This code is supported by the website: https://www.guanjihuan.com
|
||||||
|
"""
|
||||||
|
|
||||||
|
from urllib import response
|
||||||
|
from bs4 import BeautifulSoup
|
||||||
|
import re
|
||||||
|
import requests
|
||||||
|
import urllib.request
|
||||||
|
import os
|
||||||
|
import ssl
|
||||||
|
from urllib.request import urlopen
|
||||||
|
|
||||||
|
# SECURITY(review): this globally disables HTTPS certificate verification for
# urllib, so fetched pages can be tampered with in transit. It is kept only to
# preserve the script's existing behaviour; remove it once the local
# certificate store is working.
ssl._create_default_https_context = ssl._create_unverified_context

# Page whose links point at the dictionary entries to download.
WORD_LIST_URL = "https://www.guanjihuan.com/archives/10897"
# Links starting with this prefix are dictionary entries; the rest is the word.
DICTIONARY_PREFIX = 'https://www.merriam-webster.com/dictionary/'
# Directory that receives one "<word>.mp3" file per entry.
OUTPUT_DIR = 'prons'
# Header information sent with the audio download request.
REQUEST_HEADERS = {'User-Agent':'Mozilla/5.0 (X11; Fedora; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/58.0.3029.110 Safari/537.36'}
# First quoted audio URL in a page. The character class cannot cross a quote
# or whitespace, so the match always stops at the end of ONE URL instead of
# greedily running on to the last ".mp3" in the document.
MP3_URL_PATTERN = re.compile(
    r'https://media\.merriam-webster\.com/audio/prons/en/us/mp3/[^"\s]+?\.mp3(?=")'
)


def extract_word(href):
    """Return the word named by a dictionary link, or None for any other link.

    Only links that *start* with DICTIONARY_PREFIX count; a link with nothing
    after the prefix is also rejected because it names no word.
    """
    if not href.startswith(DICTIONARY_PREFIX):
        return None
    return href[len(DICTIONARY_PREFIX):] or None


def find_mp3_url(html):
    """Return the first pronunciation mp3 URL found in *html*, or None."""
    match = MP3_URL_PATTERN.search(html)
    return match.group(0) if match else None


def fetch_text(url):
    """Download *url* with urllib and return the body decoded as UTF-8."""
    with urlopen(url) as page:
        return page.read().decode('utf-8')


def download_mp3(mp3_url, destination):
    """Stream *mp3_url* into the file *destination*.

    The data is written to "<destination>.part" and renamed only after the
    download completes, so an interrupted run never leaves a truncated file
    that a later run would mistake for a finished one.

    Raises:
        requests.HTTPError: if the server answers with an error status.
    """
    partial = destination + '.part'
    with requests.get(mp3_url, headers=REQUEST_HEADERS, stream=True, timeout=30) as response:
        # Without this check an HTML error page would be saved as the mp3.
        response.raise_for_status()
        with open(partial, 'wb') as f:
            for chunk in response.iter_content(chunk_size=8192):
                f.write(chunk)
    os.replace(partial, destination)


def main():
    """Download the pronunciation of every dictionary word linked from WORD_LIST_URL.

    Words whose mp3 file already exists are skipped, so the script can be
    re-run to resume after a failure.
    """
    soup = BeautifulSoup(fetch_text(WORD_LIST_URL), features='lxml')
    os.makedirs(OUTPUT_DIR, exist_ok=True)
    for a_tag in soup.find_all('a', href=True):
        href = a_tag['href']
        word = extract_word(href)
        if word is None:
            continue
        print(word)
        destination = os.path.join(OUTPUT_DIR, word + '.mp3')
        if os.path.exists(destination):
            continue
        mp3_file = find_mp3_url(fetch_text(href))
        if mp3_file is None:
            # Not every entry page carries an audio link; skip it rather than
            # aborting the whole run.
            print('no pronunciation audio found')
            print()
            continue
        print(mp3_file)
        print()
        download_mp3(mp3_file, destination)


if __name__ == '__main__':
    main()
|
@ -0,0 +1,8 @@
|
|||||||
|
# Words in webpage: https://www.guanjihuan.com/archives/10897
|
||||||
|
# installation:
|
||||||
|
# (1) pip install pygame
|
||||||
|
# (2) pip install --upgrade guan
|
||||||
|
|
||||||
|
import guan
|
||||||
|
# Call the guan package's play_element_words() with its default arguments; the
# commented-out call further down lists keyword arguments that can be passed
# instead.
# NOTE(review): what is played and how is defined inside the guan package and
# is not visible from this script -- confirm against the guan documentation.
guan.play_element_words()
|
||||||
|
# guan.play_element_words(random_on=0, show_translation=1, show_link=1, translation_time=2, rest_time=1)
|
Loading…
x
Reference in New Issue
Block a user