music-dl/src/extractors/zaycev.py

#!/usr/bin/env python
# -*- coding: UTF-8 -*-
from __future__ import unicode_literals    # at top of module
import re
import json
import requests
import logging
from bs4 import BeautifulSoup
from . import baseFile

# Module-level logger shared by every method of the extractor defined below.
log = logging.getLogger("extractors.zaycev.net")

class interface(object):
	"""Extractor that searches zaycev.net and resolves download URLs for its tracks."""

	# Identifier of this extraction service.
	name = "zaycev.net"
	# Site root; the result links and the data-url scraped from pages are relative to it.
	_base_url = "http://zaycev.net"

	def __init__(self):
		"""Create the extractor with an empty result list."""
		# Songs found by the most recent call to search().
		self.results = []
		# Results of this extractor are flagged as not needing transcoding.
		self.needs_transcode = False
		log.debug("Started extraction service for zaycev.net")

	def search(self, text, page=1):
		"""Search zaycev.net for ``text`` and store the matches in ``self.results``.

		Every usable match becomes a ``baseFile.song`` whose ``title``, ``artist``
		and ``url`` are filled in. The previous results are discarded. Nothing is
		returned.

		:param text: search terms; must not be empty or None.
		:param page: currently unused by this extractor.
		:raises ValueError: if ``text`` is empty or None.
		"""
		if text is None or text == "":
			raise ValueError("Text must be passed and should not be blank.")
		site = self._base_url + "/search.html"
		log.debug("Retrieving data from {0}...".format("{0}?query_search={1}".format(site, text),))
		# The query goes through ``params`` so requests percent-encodes it; pasting
		# it into the URL by hand breaks on characters such as "&", "#" or "+".
		r = requests.get(site, params={"query_search": text})
		soup = BeautifulSoup(r.text, 'html.parser')
		search_results = soup.find_all("div", {"class": "musicset-track__title track-geo__title"})
		self.results = []
		for entry in search_results:
			# The easiest way to get artist and song names is to fetch the links:
			# the first one points to the artist and the second one to the song.
			links = entry.find_all("a")
			if len(links) < 2:
				# A result without both links can't be turned into a song; skip it
				# instead of aborting the whole search.
				log.debug("Skipping a search result without artist and song links.")
				continue
			artist_link, song_link = links[0], links[1]
			href = song_link.get("href")
			if not href:
				log.debug("Skipping a search result whose song link has no href.")
				continue
			s = baseFile.song(self)
			s.title = song_link.text
			s.artist = artist_link.text
			s.url = "{0}{1}".format(self._base_url, href)
			# NOTE: duration, size and bitrate are not set here; they are not read
			# from the search results page.
			self.results.append(s)
		log.debug("{0} results found.".format(len(self.results)))

	def get_download_url(self, url):
		"""Return the direct download URL for the track page at ``url``.

		The track page is fetched first; its ``musicset-track`` div carries a
		``data-url`` attribute pointing to a JSON document whose ``"url"`` key
		holds the download address.

		:param url: address of a track page, as stored in ``song.url`` by search().
		:returns: the value of the ``"url"`` key of the JSON document.
		:raises ValueError: if the page has no ``musicset-track`` div with a
			``data-url`` attribute, or if the JSON document can't be decoded.
		"""
		log.debug("Getting download URL for {0}".format(url,))
		soups = BeautifulSoup(requests.get(url).text, 'html.parser')
		track = soups.find('div', {'class': "musicset-track"})
		data_url = track.get('data-url') if track is not None else None
		if not data_url:
			# Fail with a clear message rather than an AttributeError/TypeError
			# when the page layout isn't the expected one.
			raise ValueError("Could not find download information in {0}".format(url,))
		data = json.loads(requests.get(self._base_url + data_url).text)
		log.debug("Download URL: {0}".format(data["url"]))
		return data["url"]

	def format_track(self, item):
		"""Return ``item`` formatted as "title. duration. size".

		:param item: object exposing ``title``, ``duration`` and ``size`` attributes.
		"""
		return "{0}. {1}. {2}".format(item.title, item.duration, item.size)
Added extractors package 2018-01-23 13:39:49 -06:00			`#!/usr/bin/env python`
			`# -- coding: UTF-8 --`
Additions to make code more compatible for py2 and py3 2018-03-04 12:29:25 -06:00			`from __future__ import unicode_literals # at top of module`
Added extractors package 2018-01-23 13:39:49 -06:00			`import re`
			`import json`
			`import requests`
Added logging to almost everything here 2018-03-12 17:11:05 -06:00			`import logging`
Added extractors package 2018-01-23 13:39:49 -06:00			`from bs4 import BeautifulSoup`
Added track formatting into baseSong. 2018-01-24 17:41:18 -06:00			`from . import baseFile`
Added extractors package 2018-01-23 13:39:49 -06:00
Added logging to almost everything here 2018-03-12 17:11:05 -06:00			`log = logging.getLogger("extractors.zaycev.net")`

Added extractors package 2018-01-23 13:39:49 -06:00			`class interface(object):`
Fixed search selector issue. Fixed #2 2018-07-11 11:21:55 -05:00			`name = "zaycev.net"`
Added extractors package 2018-01-23 13:39:49 -06:00
			`def __init__(self):`
			`self.results = []`
Specifies if results taken from an extractor interface require VLC transcoding or can be directly downloaded in mp3 2018-02-25 04:54:18 -06:00			`self.needs_transcode = False`
Added logging to almost everything here 2018-03-12 17:11:05 -06:00			`log.debug("Started extraction service for zaycev.net")`
Added extractors package 2018-01-23 13:39:49 -06:00
			`def search(self, text, page=1):`
Fixed extractors based on test results 2018-12-29 20:18:20 -06:00			`if text == "" or text == None:`
			`raise ValueError("Text must be passed and should not be blank.")`
Fixed zaycev.net extractor 2018-12-28 19:46:26 -06:00			`site = "http://zaycev.net/search.html?query_search=%s" % (text,)`
Added logging to almost everything here 2018-03-12 17:11:05 -06:00			`log.debug("Retrieving data from {0}...".format(site,))`
Added extractors package 2018-01-23 13:39:49 -06:00			`r = requests.get(site)`
			`soup = BeautifulSoup(r.text, 'html.parser')`
Fixed zaycev.net extractor 2018-12-28 19:46:26 -06:00			`search_results = soup.find_all("div", {"class": "musicset-track__title track-geo__title"})`
Added extractors package 2018-01-23 13:39:49 -06:00			`self.results = []`
Fixed zaycev.net extractor 2018-12-28 19:46:26 -06:00			`for i in search_results:`
			`# The easiest method to get artist and song names is to fetch links. There are only two links per result here.`
			`data = i.find_all("a")`
			`# from here, data[0] contains artist info and data[1] contains info of the retrieved song.`
Items can request their download URL by themselves 2018-01-26 11:52:18 -06:00			`s = baseFile.song(self)`
Fixed zaycev.net extractor 2018-12-28 19:46:26 -06:00			`s.title = data[1].text`
			`s.artist = data[0].text`
			`s.url = "http://zaycev.net%s" % (data[1].attrs["href"])`
			`# s.duration = self.hd[i]["duration"]`
			`# s.size = self.hd[i]["size"]`
			`# s.bitrate = self.hd[i]["bitrate"]`
Added extractors package 2018-01-23 13:39:49 -06:00			`self.results.append(s)`
Added logging to almost everything here 2018-03-12 17:11:05 -06:00			`log.debug("{0} results found.".format(len(self.results)))`
Added extractors package 2018-01-23 13:39:49 -06:00
			`def get_download_url(self, url):`
Added logging to almost everything here 2018-03-12 17:11:05 -06:00			`log.debug("Getting download URL for {0}".format(url,))`
Added extractors package 2018-01-23 13:39:49 -06:00			`soups = BeautifulSoup(requests.get(url).text, 'html.parser')`
			`data = json.loads(requests.get('http://zaycev.net' + soups.find('div', {'class':"musicset-track"}).get('data-url')).text)`
Added logging to almost everything here 2018-03-12 17:11:05 -06:00			`log.debug("Download URL: {0}".format(data["url"]))`
			`return data["url"]`

			`def format_track(self, item):`
			`return "{0}. {1}. {2}".format(item.title, item.duration, item.size)`