This was determined programmatically by attempting a simple HTTP HEAD request to the root path (/) of each of the URLs given:

```python
from lxml import etree
from urllib import parse
import requests

doc = etree.parse("ultimate_providers.xml")
root = doc.getroot()
for provider in root:
    parsed_url = parse.urlparse(provider.get("url"))
    url = f"{parsed_url.scheme}://{parsed_url.netloc}/"
    try:
        requests.head(url, timeout=5)
    except Exception as e:
        print(parsed_url.netloc)
```

Note that these were also removed from songinfoview where present, and from outgoingdatacreator. The two lists there were found to be inconsistent, but that isn't the subject of this PR.

Signed-off-by: Marcus Müller <>
267 lines
13 KiB
267 lines
13 KiB
<?xml version="1.0" encoding="UTF-8"?>
<!-- Provider entry; url template: {artist}/{title}.html, charset: utf-8. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name="" title="{artist} LYRICS - {title}" charset="utf-8" url="{artist}/{title}.html">
  <urlFormat replace=" ._@,;&amp;\/()'&quot;-" with=""/>
  <item begin="&lt;!-- Usage of content by any third-party lyrics provider is prohibited by our licensing agreement. Sorry about that. --&gt;" end="&lt;/div&gt;"/>
  <item tag="&lt;B&gt;"/>
  <item begin="&lt;i&gt;[" end="]&lt;/i&gt;"/>
  <item begin="[" end="]"/>
  <invalidIndicator value="&lt;h1&gt;Welcome to AZLyrics!&lt;/h1&gt;"/>
</provider>
<!-- Provider entry labelled "(Bollywood songs)"; url template: {Title}, charset: utf-8. -->
<!-- NOTE(review): the name starts with a space and the url has no scheme/host; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; entities. -->
<provider name=" (Bollywood songs)" title="{title} Song Lyrics -" charset="utf-8" url="{Title}">
  <urlFormat replace=" _@;\/&quot;'()[]" with="-"/>
  <urlFormat replace="?" with=""/>
  <item begin="&lt;div class=&quot;entry-content&quot;&gt;" end="&lt;/div&gt;"/>
  <invalidIndicator value="Couldn't find that page."/>
</provider>
<!-- Provider entry addressed per album; url template: {artist2}/{album2}.html, charset: utf-8. -->
<!-- Both items start at the heading of track {track}; they differ only in the end marker. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<provider name="" title="{ARTIST} LYRICS - &quot;{title}&quot; ({year}) album" charset="utf-8" url="{artist2}/{album2}.html">
  <item begin="&lt;h3&gt;&lt;a name=&quot;{track}&quot;&gt;{track}. {Title2}&lt;/a&gt;&lt;/h3&gt;&lt;br /&gt;" end="&lt;h3&gt;"/>
  <item begin="&lt;h3&gt;&lt;a name=&quot;{track}&quot;&gt;{track}. {Title2}&lt;/a&gt;&lt;/h3&gt;&lt;br /&gt;" end="&lt;div class=&quot;thanks&quot;&gt;"/>
  <invalidIndicator value="The page you requested was not found on"/>
</provider>
<!-- Provider entry; url template: {artist}-{title}-lyrics.html, charset: iso-8859-1. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name="" title="{artist} - {title} lyrics" charset="iso-8859-1" url="{artist}-{title}-lyrics.html">
  <urlFormat replace=" _@,;&amp;\/'&quot;" with="-"/>
  <urlFormat replace="." with=""/>
  <item tag="&lt;div id=&quot;lyricsContent&quot;&gt;"/>
  <item tag="&lt;p&gt;"/>
  <item begin="&lt;b&gt;" end="&lt;/b&gt;"/>
</provider>
<!-- Provider entry; url template: {a}/{artist}-lyrics/{title}-lyrics.html, charset: iso-8859-1. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name="" title="{title} Lyrics - {artist}" charset="iso-8859-1" url="{a}/{artist}-lyrics/{title}-lyrics.html">
  <urlFormat replace=" _@;&amp;\/&quot;" with="-"/>
  <urlFormat replace="'" with="_"/>
  <item tag="&lt;div class='ly' style='font-size:12px;'&gt;"/>
  <item tag="&lt;strong&gt;"/>
  <item tag="&lt;em&gt;"/>
  <invalidIndicator value="Page not Found"/>
</provider>
<!-- Provider entry "Encyclopaedia Metallum"; the url is a query string carrying {title} and {artist}, charset: utf-8. -->
<!-- The first item has a url attribute ({id}) instead of begin/end markers. -->
<!-- NOTE(review): the title placeholder was written "{title" without its closing brace; closed here. The url has no scheme/host; confirm against upstream. -->
<provider name="Encyclopaedia Metallum" title="{title} Lyrics - {artist}" charset="utf-8" url="{title}&amp;bandName={artist}&amp;ExactBandMatch=1">
  <item url="{id}"/>
  <item begin="id=\&quot;lyricsLink_" end="&quot;"/>
  <invalidIndicator value="&quot;iTotalRecords&quot;: 0"/>
  <invalidIndicator value="lyrics not available"/>
</provider>
<!-- Provider entry; url template: {artist}-{title}-lyrics, charset: utf-8. No title attribute is given. -->
<!-- The urlFormat list strips punctuation, turns space and colon into "-", and folds accented letters to ASCII. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<provider name="" charset="utf-8" url="{artist}-{title}-lyrics">
  <urlFormat replace=",._@!#%^*+;\/&quot;'()[]" with=""/>
  <urlFormat replace=" :" with="-"/>
  <!-- When $ is used as the dollar sign it is omitted from the url.
       When $ is used instead of 's', in some cases it is replaced by 's'
       (Too $hort -> too-short), in other cases it is omitted
       ($uicideboy$ -> uicideboy).
       It is omitted here, although that will be problematic in some cases. -->
  <urlFormat replace="$" with=""/>
  <urlFormat replace="ÄÂÀÁÃäâàáã" with="a"/>
  <urlFormat replace="ËÊÈÉëêèé" with="e"/>
  <urlFormat replace="ÏÌïì" with="i"/>
  <urlFormat replace="ÖÔÒÓÕöôòóõ" with="o"/>
  <urlFormat replace="ÜŪÙÚüūùú" with="u"/>
  <urlFormat replace="ŸÝÿý" with="y"/>
  <urlFormat replace="Ññ" with="n"/>
  <urlFormat replace="Çç" with="c"/>
  <urlFormat replace="ß" with="ss"/>
  <urlFormat replace="&amp;" with="and"/>
  <item tag="&lt;div class=&quot;lyrics&quot;&gt;"/>
  <item begin="&lt;!--" end="--&gt;"/>
  <item begin="&lt;a href=" end="&gt;"/>
  <item begin="&lt;/a" end="&gt;"/>
</provider>
<!-- Provider entry; the url is a query string carrying {title} and artista={artist}, charset: utf-8, empty title. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name="" title="" charset="utf-8" url="{title}&amp;artista={artist}">
  <urlFormat replace="_@,;&amp;\/&quot;" with="_"/>
  <urlFormat replace=" " with="+"/>
  <item begin="&lt;/div&gt;" end="&lt;/div&gt;"/>
  <invalidIndicator value="Verifique se o nome do seu arquivo e sua"/>
</provider>
<!-- Provider entry; the url is a query string carrying {artist} and track={title}, charset: utf-8, empty title. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry markup fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name="" title="" charset="utf-8" url="{artist}&amp;track={title}">
  <urlFormat replace="_@,;&amp;\/&quot;#" with="_"/>
  <item tag="&lt;response&gt;"/>
  <invalidIndicator value="ERROR"/>
</provider>
<!-- Provider entry; url template: {artist}/{title}.html, charset: utf-8. Declares two invalidIndicator strings. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name="" title="{artist} - {title} Lyrics" charset="utf-8" url="{artist}/{title}.html">
  <urlFormat replace=" _@,;&amp;\/&quot;" with="-"/>
  <urlFormat replace="'." with=""/>
  <item tag="&lt;div id=&quot;lyrics&quot; class=&quot;SCREENONLY&quot;&gt;"/>
  <item begin="&lt;br&gt;&lt;br&gt;&lt;a target='_blank'" end="&gt;&lt;/a&gt;"/>
  <invalidIndicator value="Click to search for the Lyrics on"/>
  <invalidIndicator value="we do not have the lyric for this song"/>
</provider>
<!-- Provider entry; url template: {Artist}:{Title}, charset: utf-8. "?" in the url fields is replaced by %3F. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; entities. -->
<provider name="" title="{artist}:{title} Lyrics - " charset="utf-8" url="{Artist}:{Title}">
  <urlFormat replace=" _@;\&quot;" with="_"/>
  <urlFormat replace="?" with="%3F"/>
  <item begin="&lt;div class='lyricbox'&gt;" end="&lt;div class='lyricsbreak'"/>
  <item tag="&lt;div class='rtMatcher'&gt;"/>
  <item tag="&lt;span style=&quot;padding:1em&quot;&gt;"/>
</provider>
<!-- Provider entry; url template: {title}_lyrics-{artist}.html, charset: iso-8859-1. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name="" title="{title} lyrics {artist}" charset="iso-8859-1" url="{title}_lyrics-{artist}.html">
  <urlFormat replace=" _@,;&amp;\/'&quot;" with="_"/>
  <urlFormat replace="." with=""/>
  <item tag="&lt;div id=EchoTopic&gt;"/>
  <item tag="&lt;textarea name=&quot;songscpy&quot; id=&quot;songscpyid&quot; onclick=&quot;callselect('songscpyid','selectswf')&quot; rows=&quot;3&quot; cols=&quot;45&quot; READONLY&gt;"/>
</provider>
<!-- Provider entry; url template: {artist}-{title}-lyrics.html, charset: utf-8. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name="" title="{artist} - {title} LYRICS" charset="utf-8" url="{artist}-{title}-lyrics.html">
  <urlFormat replace=" _@,;&amp;\/&quot;" with="-"/>
  <urlFormat replace="." with=""/>
  <item tag="&lt;div id=&quot;div_customCSS&quot;&gt;"/>
  <invalidIndicator value="We haven't lyrics of this song"/>
</provider>
<!-- Provider entry; url template: {title}_lyrics_{artist}.html, charset: iso-8859-1. -->
<!-- The first item uses the same span start tag as both its begin and its end marker. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<provider name="" title="{artist} - {title} Lyrics" charset="iso-8859-1" url="{title}_lyrics_{artist}.html">
  <urlFormat replace=" _@;&amp;\/&quot;'." with="_"/>
  <item begin="&lt;span style=&quot;font-size:14px;&quot;&gt;" end="&lt;span style=&quot;font-size:14px;&quot;&gt;"/>
  <item begin="&lt;/center&gt;" end="&lt;a"/>
  <invalidIndicator value="The lyrics you requested is not in our archive yet,"/>
</provider>
<!-- Provider entry; url template: {a}/{artist}/{title}.html, charset: iso-8859-1. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name="" title="{artist} - {title} lyrics" charset="iso-8859-1" url="{a}/{artist}/{title}.html">
  <urlFormat replace=" ._@,;&amp;\/&quot;" with="_"/>
  <item tag="&lt;div id='songlyrics_h' class='dn'&gt;"/>
  <invalidIndicator value="Sorry, we have no"/>
</provider>
<!-- Provider entry; the url is a query string carrying {title} and artist={artist}, charset: utf-8. -->
<!-- Spaces in the url fields are replaced by %20 and apostrophes are dropped. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<provider name="" title="{artist} - {title} Lyrics" charset="utf-8" url="{title}&amp;artist={artist}">
  <urlFormat replace="_@;&amp;\/&quot;" with="-"/>
  <urlFormat replace="'" with=""/>
  <urlFormat replace=" " with="%20"/>
  <item tag="&lt;div id=&quot;lyrics&quot;&gt;"/>
</provider>
<!-- Provider entry; url template: {artist}/{title}/, charset: iso-8859-1. -->
<!-- The first item uses the same literal text as both its begin and its end marker. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<provider name="" title="{title} lyrics {artist}" charset="iso-8859-1" url="{artist}/{title}/">
  <urlFormat replace=" _@,;&amp;\/&quot;" with="+"/>
  <urlFormat replace="'." with=""/>
  <item begin="Ringtone to your Cell" end="Ringtone to your Cell"/>
  <item begin="&lt;div style=&quot;text-align:center;&quot;&gt;" end="&lt;a"/>
  <invalidIndicator value="Page not Found"/>
</provider>
<!-- Provider entry; url template: {artist}:{title}, charset: utf-8, empty title. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name="" title="" charset="utf-8" url="{artist}:{title}">
  <urlFormat replace=" _@,;&amp;\/&quot;" with="_"/>
  <urlFormat replace="." with=""/>
  <item begin="&lt;/table&gt;" end="&lt;div class=&quot;printfooter&quot;&gt;"/>
  <item tag="&lt;p&gt;"/>
</provider>
<!-- Provider entry; url template: {a}/{artist}/{title}/, charset: utf-8. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name="" title="{artist} &quot;{title}&quot; Lyrics" charset="utf-8" url="{a}/{artist}/{title}/">
  <urlFormat replace=" _@,;&amp;\/&quot;" with="-"/>
  <urlFormat replace="'." with=""/>
  <item tag="&lt;span id=gn_lyricsB&gt;"/>
  <item tag="&lt;div class=&quot;KonaBody&quot; id=&quot;EchoTopic&quot;&gt;"/>
  <item tag="&lt;font size=2&gt;"/>
  <item begin="&lt;b&gt;&lt;i&gt;" end="&lt;/u&gt;&lt;/b&gt;:"/>
  <item begin="&lt;b&gt;Lyrics" end="&lt;/b&gt;"/>
  <invalidIndicator value="Something went wrong"/>
</provider>
<!-- Provider entry whose title mentions Musixmatch; url template: {Artist}/{Title}, charset: utf-8. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; entities. -->
<provider name="" title="{artist} - {title} lyrics | Musixmatch" charset="utf-8" url="{Artist}/{Title}">
  <urlFormat replace=" _@;\/&quot;'()[]" with="-"/>
  <urlFormat replace="?" with=""/>
  <item begin="&lt;span id=&quot;lyrics-html&quot;" end="&lt;/span&gt;"/>
  <item begin=" data-reactid=&quot;" end="&quot;&gt;"/>
  <invalidIndicator value="We couldn't find that page."/>
</provider>
<!-- Provider entry; url template: {artist}/{title}-lyrics/, charset: utf-8. Declares two invalidIndicator strings. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name="" title="{title} LYRICS - {artist}" charset="utf-8" url="{artist}/{title}-lyrics/">
  <urlFormat replace=" ._@,;&amp;\/&quot;" with="-"/>
  <urlFormat replace="'" with="_"/>
  <item tag="&lt;p id=&quot;songLyricsDiv&quot; ondragstart=&quot;return false;&quot; onselectstart=&quot;return false;&quot; oncontextmenu=&quot;return false;&quot; class=&quot;songLyricsV14&quot; style=&quot;font-size: 14px;z-index: 9999;position: absolute;left: -6000px;&quot;&gt;"/>
  <item begin=" [" end="] "/>
  <invalidIndicator value="Sorry, we have no"/>
  <invalidIndicator value="This is an upcoming album and we do not have the"/>
</provider>
<!-- Provider entry labelled "(Original lyric language)"; url template: ,{artist},{title}.html, charset: utf-8. -->
<!-- NOTE(review): the name starts with a space and the url starts with a comma; both look stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name=" (Original lyric language)" title="{artist} - {title} - tekst" charset="utf-8" url=",{artist},{title}.html">
  <urlFormat replace=" _@,;&amp;\/'&quot;." with="_"/>
  <item begin="&lt;div class=&quot;song-text&quot;&gt;" end="&lt;a href=&quot;javascript:;&quot;"/>
  <item tag="&lt;div class=&quot;tlumaczenie&quot;&gt;"/>
  <item begin="&lt;h2&gt;" end="&lt;/h2&gt;&lt;br /&gt;"/>
</provider>
<!-- Provider entry labelled "(Translated to Polish)"; url template: ,{artist},{title}.html, charset: utf-8. -->
<!-- NOTE(review): the name starts with a space and the url starts with a comma; both look stripped, confirm against upstream. -->
<!-- NOTE(review): the quote boundaries of the two item entries were reconstructed from unescaped text; verify the begin/end values. -->
<provider name=" (Translated to Polish)" title="{artist} - {title} - tekst" charset="utf-8" url=",{artist},{title}.html">
  <urlFormat replace=" _@,;&amp;\/'&quot;." with="_"/>
  <item begin="&lt;div id=&quot;translation&quot; class=" end="&lt;a href="/>
  <item begin="&quot;id-" end="&quot;&gt;"/>
</provider>
<!-- Provider entry; url template: {artist},{title},tekst-piosenki, charset: utf-8. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name="" title="{artist} - {title} - tekst" charset="utf-8" url="{artist},{title},tekst-piosenki">
  <urlFormat replace=" _@,;&amp;\/&quot;'" with="-"/>
  <urlFormat replace="." with=""/>
  <item begin="&lt;div class=&quot;songText&quot; id=&quot;songContent&quot;&gt;" end="&lt;/div&gt;"/>
</provider>
<!-- Provider entry whose title mentions VAGALUME; url template: {artist}/{title}.html, charset: iso-8859-1. -->
<!-- NOTE(review): name is empty and url has no scheme/host here; looks stripped, confirm against upstream. -->
<!-- Attribute values carry HTML fragments, hence the &lt; &gt; &quot; &amp; entities. -->
<provider name="" title="{title} de {artist} no VAGALUME" charset="iso-8859-1" url="{artist}/{title}.html">
  <urlFormat replace=" _@,;&amp;\/'&quot;." with="-"/>
  <item tag="&lt;span class=&quot;editable_area&quot;&gt;"/>
</provider>
<!-- Provider entry labelled "(Portuguese translations)"; url template: {artist}/{title}-traducao.html, charset: iso-8859-1. -->
<!-- NOTE(review): the name starts with a space and the url has no scheme/host; looks stripped, confirm against upstream. -->
<!-- NOTE(review): this is the last entry visible; confirm no further child elements follow before the end tag. -->
<provider name=" (Portuguese translations)" title="{title} de {artist} no VAGALUME" charset="iso-8859-1" url="{artist}/{title}-traducao.html">
  <urlFormat replace=" _@,;&amp;\/'&quot;." with="-"/>
  <item tag="&lt;div class=&quot;tab_traducao sideBySide lyricArea tab_tra_pt&quot;&gt;"/>
</provider>