<?xml version="1.0" encoding="UTF-8"?>
<scraper framework="1.1" date="2013-05-29">
|
||
|
<NfoUrl dest="3">
	<!-- Builds a web-service lookup URL from a musicbrainz.org artist link.
	     Input:  buffer 1 ($$1), the text being scanned for the link.
	     Output: buffer 3, a <url> element pointing at
	             $INFO[mbsite]/ws/2/artist/<captured part>?inc=url-rels.
	     Markup inside the output attribute is entity-escaped so the file stays
	     well-formed; the parsed attribute value is the literal <url>...</url>. -->
	<RegExp input="$$1" output="&lt;url&gt;$INFO[mbsite]/ws/2/artist/\1?inc=url-rels&lt;/url&gt;" dest="3">
		<!-- \1 = everything following "musicbrainz.org/artist/" -->
		<expression>musicbrainz.org/artist/(.+)</expression>
	</RegExp>
</NfoUrl>
|
||
|
<ResolveIDToUrl dest="3">
	<!-- Turns an artist identifier into a web-service lookup URL.
	     Input:  buffer 1 ($$1), used verbatim as the artist path segment.
	     Output: buffer 3, a <url> element pointing at
	             $INFO[mbsite]/ws/2/artist/<id>?inc=url-rels.
	     Markup inside the output attribute is entity-escaped so the file stays
	     well-formed; the parsed attribute value is the literal <url>...</url>. -->
	<RegExp input="$$1" output="&lt;url&gt;$INFO[mbsite]/ws/2/artist/\1?inc=url-rels&lt;/url&gt;" dest="3">
		<!-- \1 = the whole input -->
		<expression>(.+)</expression>
	</RegExp>
</ResolveIDToUrl>
|
||
|
|
||
|
<CreateArtistSearchUrl dest="3">
	<!-- Builds the artist search request.
	     Input:  buffer 1 ($$1), the artist name to search for
	             (the %20 / %2e tokens below suggest it arrives URL-encoded;
	             TODO confirm against the caller).
	     Output: buffer 3, a <url> element querying
	             $INFO[mbsite]/ws/2/artist/ with artist:"<buffer 4>" and limit=100.
	     Nested RegExp elements fill buffer 4 before the enclosing one emits the URL.
	     '<', '&' and '"' inside the output attribute are entity-escaped so the
	     file stays well-formed; the parsed value is unchanged. -->
	<RegExp input="$$1" output="&lt;url&gt;$INFO[mbsite]/ws/2/artist/?fmt=xml&amp;query=artist:&quot;$$4&quot;&amp;limit=100&lt;/url&gt;" dest="3">
		<!-- Default search term: the full input. -->
		<RegExp input="$$1" output="\1" dest="4">
			<expression noclean="1">(.+)</expression>
		</RegExp>
		<!-- Keep only the part preceding a "Ft." / "Feat." / " and " marker, if any. -->
		<RegExp input="$$1" output="\1" dest="6">
			<expression noclean="1">(.+)(?:Ft%2e|Feat%2e|%20Ft\.|%20Feat\.|%20and%20)</expression>
		</RegExp>
		<!-- When a shortened name was captured in buffer 6, it replaces the search term. -->
		<RegExp input="$$6" output="\1" dest="4">
			<expression>(.+)</expression>
		</RegExp>
		<expression/>
	</RegExp>
</CreateArtistSearchUrl>
|
||
|
<GetArtistSearchResults dest="8">
	<!-- Converts the search response into a <results> list.
	     Input:  buffer 1 ($$1), the search response body.
	     Output: buffer 8, <results sorted="yes"> wrapping one <entity> per match.
	     Flow:   every match is rendered as an <entity> into buffer 9, buffer 9 is
	             copied to buffer 5, and the enclosing RegExp wraps buffer 5.
	     Markup in output attributes and in the expression text is entity-escaped
	     so the file stays well-formed; parsed values are unchanged. -->
	<RegExp input="$$5" output="&lt;results sorted=&quot;yes&quot;&gt;\1&lt;/results&gt;" dest="8">
		<!-- Capture groups: \1 artist id, \2 name, \3 sort-name element (unused),
		     \4 disambiguation text. The entity URL is cached as mb-<id>-artist.xml. -->
		<RegExp input="$$1" output="&lt;entity&gt;&lt;title&gt;\2&lt;/title&gt;&lt;disambiguation&gt;\4&lt;/disambiguation&gt;&lt;url cache=&quot;mb-\1-artist.xml&quot;&gt;$INFO[mbsite]/ws/2/artist/\1?inc=url-rels&lt;/url&gt;&lt;/entity&gt;" dest="9">
			<expression repeat="yes" noclean="1">artist\sid="([^"]*)"(?:\stype="[^"]*")*(?:\stype-id="[^"]*")*?\s.*?score="[^"]*"&gt;&lt;name&gt;([^&lt;]*)&lt;/name&gt;(&lt;sort-name&gt;[^&lt;]*&lt;/sort-name&gt;)?(?:&lt;gender&gt;[^&lt;]*&lt;/gender&gt;)*(?:&lt;country&gt;[^&lt;]*&lt;/country&gt;)*(?:&lt;area.*?&lt;/area&gt;)*(?:&lt;begin-area.*?&lt;/begin-area&gt;)*(?:&lt;disambiguation&gt;(.*?)&lt;/disambiguation&gt;)*</expression>
		</RegExp>
		<!-- Hand the collected entities to buffer 5, which the enclosing RegExp reads. -->
		<RegExp input="$$9" output="\1" dest="5">
			<expression noclean="1">(.+)</expression>
		</RegExp>
		<expression noclean="1"/>
	</RegExp>
</GetArtistSearchResults>
|
||
|
<GetArtistDetails dest="3" clearbuffers="no">
	<!-- Builds the <details> document for one artist.
	     Input:  buffer 1 ($$1), the artist lookup response.
	     Output: buffer 3, <details> wrapping everything accumulated in buffer 5.
	     Buffers used: 5 = accumulated detail fields and chain calls,
	                   8 = MusicBrainz artist id, 9 = allmusic.com artist path.
	     clearbuffers="no" keeps the buffers alive after this function returns
	     (presumably so the chained functions can still read buffer 8; TODO confirm).
	     Markup in output attributes and expression text is entity-escaped so the
	     file stays well-formed; parsed values are unchanged. -->
	<RegExp input="$$5" output="&lt;details&gt;\1&lt;/details&gt;" dest="3">
		<!--MBID - Artist-->
		<!-- Step 1: copy the attribute text of the <artist ...> tag into buffer 5. -->
		<RegExp input="$$1" output="\1" dest="5">
			<expression noclean="1">&lt;artist(.*?)&lt;name&gt;([^&lt;]*)</expression>
		</RegExp>
		<!-- Step 2: pull the id="..." value out of that attribute text into buffer 8. -->
		<RegExp input="$$5" output="\1" dest="8">
			<expression noclean="1">\sid="([^"]*)"</expression>
		</RegExp>
		<!--AMGID - Artist-->
		<!-- \2 = the path following allmusic.com/artist/, stored in buffer 9. -->
		<RegExp input="$$1" output="\2" dest="9">
			<expression noclean="1">&gt;http.?://(www.)?allmusic.com/artist/([^&lt;]*)</expression>
		</RegExp>
		<!-- Basic fields. The first write uses dest="5" (no '+'), replacing the
		     scratch attribute text from step 1; later writes append with "5+". -->
		<RegExp input="$$1" output="&lt;musicBrainzArtistID&gt;$$8&lt;/musicBrainzArtistID&gt;&lt;name&gt;\1&lt;/name&gt;" dest="5">
			<expression noclean="1">&lt;artist.*?&lt;name&gt;([^&lt;]*)</expression>
		</RegExp>
		<RegExp input="$$1" output="&lt;sortname&gt;\1&lt;/sortname&gt;" dest="5+">
			<expression noclean="1">&lt;artist.*?&lt;sort-name&gt;([^&lt;]*)</expression>
		</RegExp>
		<RegExp input="$$1" output="&lt;type&gt;\1&lt;/type&gt;" dest="5+">
			<expression noclean="1">&lt;artist.*?\stype="(Person|Group|Orchestra|Choir|Character|Other)"</expression>
		</RegExp>
		<RegExp input="$$1" output="&lt;gender&gt;\1&lt;/gender&gt;" dest="5+">
			<expression noclean="1">&lt;gender.*?&gt;([^&lt;]*)</expression>
		</RegExp>
		<RegExp input="$$1" output="&lt;disambiguation&gt;\1&lt;/disambiguation&gt;" dest="5+">
			<expression noclean="1">&lt;disambiguation&gt;([^&lt;]*)</expression>
		</RegExp>
		<!-- Artwork chains, each gated by its "conditional" setting and emitted
		     only when buffer 8 (the MusicBrainz id) is non-empty. -->
		<RegExp input="$$8" conditional="fanarttvthumbs" output="&lt;chain function=&quot;GetFanartTvArtistThumbsByMBID&quot;&gt;\1&lt;/chain&gt;" dest="5+">
			<expression noclean="1">(.+)</expression>
		</RegExp>
		<RegExp input="$$8" conditional="fanarttvartistcl" output="&lt;chain function=&quot;GetFanartTvArtistClearlogoByMBID&quot;&gt;\1&lt;/chain&gt;" dest="5+">
			<expression noclean="1">(.+)</expression>
		</RegExp>
		<RegExp input="$$8" conditional="fanarttvartistbanner" output="&lt;chain function=&quot;GetFanartTvArtistBannerByMBID&quot;&gt;\1&lt;/chain&gt;" dest="5+">
			<expression noclean="1">(.+)</expression>
		</RegExp>
		<RegExp input="$$8" conditional="tadbthumbs" output="&lt;chain function=&quot;GetTADBArtistThumbsByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="5+">
			<expression noclean="1">(.+)</expression>
		</RegExp>
		<RegExp input="$$8" conditional="tadbartistclearlogo" output="&lt;chain function=&quot;GetTADBArtistClearlogoByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="5+">
			<expression noclean="1">(.+)</expression>
		</RegExp>
		<RegExp input="$$8" conditional="tadbartistclearart" output="&lt;chain function=&quot;GetTADBArtistClearartByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="5+">
			<expression noclean="1">(.+)</expression>
		</RegExp>
		<RegExp input="$$8" conditional="tadbartistlandscape" output="&lt;chain function=&quot;GetTADBArtistLandscapeByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="5+">
			<expression noclean="1">(.+)</expression>
		</RegExp>
		<RegExp input="$$8" conditional="tadbartistbanner" output="&lt;chain function=&quot;GetTADBArtistBannerByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="5+">
			<expression noclean="1">(.+)</expression>
		</RegExp>
		<RegExp input="$$8" conditional="fanarttvfanart" output="&lt;chain function=&quot;GetFanartTvArtistFanartsByMBID&quot;&gt;\1&lt;/chain&gt;" dest="5+">
			<expression noclean="1">(.+)</expression>
		</RegExp>
		<RegExp input="$$8" conditional="tadbfanart" output="&lt;chain function=&quot;GetTADBArtistFanartsByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="5+">
			<expression noclean="1">(.+)</expression>
		</RegExp>
		<!-- allmusic.com routing: chain GetAMGData when buffer 9 holds an id,
		     otherwise (buffer 9 empty, matched by ^$) chain AMGFallback. -->
		<RegExp input="$$9" output="&lt;chain function=&quot;GetAMGData&quot;&gt;\1&lt;/chain&gt;" dest="5+">
			<expression noclean="1">(.+)</expression>
		</RegExp>
		<RegExp input="$$9" output="&lt;chain function=&quot;AMGFallback&quot;&gt;\1&lt;/chain&gt;" dest="5+">
			<expression noclean="1">^$</expression>
		</RegExp>
		<!-- Per-field source selection: a chain is added only when the matching
		     $INFO[...] setting contains the named provider. -->
		<RegExp input="$INFO[discogsource]" output="&lt;chain function=&quot;GetMBDiscographyByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="5+">
			<expression>MusicBrainz</expression>
		</RegExp>
		<!-- NOTE(review): "GetMBLafeSpanByMBID" looks like a misspelling of
		     "LifeSpan" (compare GetTADBLifeSpanByMBID below). The chained function
		     is defined outside this file, so the name is kept as found; confirm
		     against its definition before renaming. -->
		<RegExp input="$INFO[lifespansource]" output="&lt;chain function=&quot;GetMBLafeSpanByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="5+">
			<expression>MusicBrainz</expression>
		</RegExp>
		<RegExp input="$INFO[biogsource]" output="&lt;chain function=&quot;GetTADBBiographyByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="5+">
			<expression>TheAudioDb.com</expression>
		</RegExp>
		<RegExp input="$INFO[genressource]" output="&lt;chain function=&quot;GetTADBArtistGenresByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="5+">
			<expression>TheAudioDb.com</expression>
		</RegExp>
		<RegExp input="$INFO[stylessource]" output="&lt;chain function=&quot;GetTADBArtistStylesByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="5+">
			<expression>TheAudioDb.com</expression>
		</RegExp>
		<RegExp input="$INFO[moodssource]" output="&lt;chain function=&quot;GetTADBArtistMoodsByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="5+">
			<expression>TheAudioDb.com</expression>
		</RegExp>
		<RegExp input="$INFO[discogsource]" output="&lt;chain function=&quot;GetTADBDiscographyByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="5+">
			<expression>TheAudioDb.com</expression>
		</RegExp>
		<RegExp input="$INFO[lifespansource]" output="&lt;chain function=&quot;GetTADBLifeSpanByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="5+">
			<expression>TheAudioDb.com</expression>
		</RegExp>
		<expression noclean="1"/>
	</RegExp>
</GetArtistDetails>
|
||
|
|
||
|
<GetAMGData dest="5" clearbuffers="no">
	<!-- Emits the allmusic.com chain calls selected in the add-on settings.
	     Input:  buffer 1 ($$1), copied verbatim into buffer 9 and passed to every
	             chained function as its argument (GetArtistDetails chains this
	             function with the allmusic.com artist path).
	     Output: buffer 5, <details> wrapping the chain calls collected in buffer 2.
	     Markup in output attributes is entity-escaped so the file stays
	     well-formed; parsed values are unchanged. -->
	<RegExp input="$$2" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
		<!-- Keep the incoming id in buffer 9 for the chains below. -->
		<RegExp input="$$1" output="\1" dest="9">
			<expression/>
		</RegExp>
		<!-- Reset buffer 2; needed because clearbuffers="no" preserves old content. -->
		<RegExp input="" output="" dest="2">
			<expression />
		</RegExp>
		<!-- One chain per field whose source setting names allmusic.com. -->
		<RegExp input="$INFO[discogsource]" output="&lt;chain function=&quot;GetAMGDiscographyByAMGID&quot;&gt;$$9&lt;/chain&gt;" dest="2">
			<expression>allmusic.com</expression>
		</RegExp>
		<RegExp input="$INFO[lifespansource]" output="&lt;chain function=&quot;GetAMGArtistLifeSpanByAMGID&quot;&gt;$$9&lt;/chain&gt;" dest="2+">
			<expression>allmusic.com</expression>
		</RegExp>
		<RegExp input="$INFO[biogsource]" output="&lt;chain function=&quot;GetAMGBiographyByAMGID&quot;&gt;$$9&lt;/chain&gt;" dest="2+">
			<expression>allmusic.com</expression>
		</RegExp>
		<RegExp input="$INFO[genressource]" output="&lt;chain function=&quot;GetAMGArtistGenresByAMGID&quot;&gt;$$9&lt;/chain&gt;" dest="2+">
			<expression>allmusic.com</expression>
		</RegExp>
		<RegExp input="$INFO[stylessource]" output="&lt;chain function=&quot;GetAMGArtistStylesByAMGID&quot;&gt;$$9&lt;/chain&gt;" dest="2+">
			<expression>allmusic.com</expression>
		</RegExp>
		<RegExp input="$INFO[moodssource]" output="&lt;chain function=&quot;GetAMGArtistMoodsByAMGID&quot;&gt;$$9&lt;/chain&gt;" dest="2+">
			<expression>allmusic.com</expression>
		</RegExp>
		<RegExp input="$INFO[yearsasource]" output="&lt;chain function=&quot;GetAMGArtistYearsActiveByAMGID&quot;&gt;$$9&lt;/chain&gt;" dest="2+">
			<expression>allmusic.com</expression>
		</RegExp>
		<expression noclean="1" />
	</RegExp>
</GetAMGData>
|
||
|
|
||
|
<AMGFallback dest="5" clearbuffers="no">
	<!-- Emits the fallback chain calls used when no allmusic.com id is available
	     (GetArtistDetails chains this function when its buffer 9 is empty).
	     Input:  buffer 8, presumably still holding the MusicBrainz artist id set
	             by GetArtistDetails (both use clearbuffers="no"; TODO confirm).
	     Output: buffer 5, <details> wrapping the chain calls collected in buffer 11.
	     Every nested RegExp must append to buffer 11: the enclosing RegExp
	     overwrites buffer 5, so anything appended to buffer 5 here would be lost.
	     NOTE(review): buffer 11 is only ever appended to and never reset in this
	     function; verify nothing else leaves content in it.
	     Markup in output attributes is entity-escaped so the file stays
	     well-formed; parsed values are unchanged. -->
	<RegExp input="$$11" output="&lt;details&gt;\1&lt;/details&gt;" dest="5">
		<RegExp input="$INFO[discogfbsource]" output="&lt;chain function=&quot;GetMBDiscographyByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="11+">
			<expression>MusicBrainz</expression>
		</RegExp>
		<!-- NOTE(review): "GetMBLafeSpanByMBID" looks like a misspelling of
		     "LifeSpan"; the chained function is defined outside this file, so the
		     name is kept as found. Confirm against its definition before renaming. -->
		<RegExp input="$INFO[lifespanfbsource]" output="&lt;chain function=&quot;GetMBLafeSpanByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="11+">
			<expression>MusicBrainz</expression>
		</RegExp>
		<RegExp input="$INFO[stylesfbsource]" output="&lt;chain function=&quot;GetTADBArtistStylesByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="11+">
			<expression>TheAudioDb.com</expression>
		</RegExp>
		<RegExp input="$INFO[moodsfbsource]" output="&lt;chain function=&quot;GetTADBArtistMoodsByMBID&quot;&gt;$$8&lt;/chain&gt;" dest="11+">
			<expression>TheAudioDb.com</expression>
		</RegExp>
		<expression noclean="1" />
	</RegExp>
</AMGFallback>
|
||
|
|
||
|
</scraper>
|