Remove ComicSherpa

This legacy site has already been offline for a few weeks now and
is probably not coming back.
This commit is contained in:
Tobias Gruetzmacher 2021-04-02 09:28:56 +02:00
parent 6436bc0c6a
commit 2c8bb90d4e
3 changed files with 249 additions and 322 deletions

View file

@ -1,211 +0,0 @@
# SPDX-License-Identifier: MIT
# Copyright (C) 2004-2008 Tristan Seligmann and Jonathan Jacobs
# Copyright (C) 2012-2014 Bastian Kleineidam
# Copyright (C) 2015-2020 Tobias Gruetzmacher
from ..scraper import _ParserScraper
class ComicSherpa(_ParserScraper):
    """Scraper for the comics published on www.comicssherpa.com.

    Every instance handles exactly one comic, which is selected through the
    ``uc_comic`` query parameter of the site's ``feature`` page.
    """

    # Site root; every instance replaces this with its own feature-page URL.
    url = 'http://www.comicssherpa.com/site/'
    # XPath matching any <img> whose ``src`` contains "/comics/".
    imageSearch = '//img[contains(@src, "/comics/")]'
    # XPath matching the link whose text is exactly "previous day".
    prevSearch = '//a[text()="previous day"]'
    help = 'Index format: yyyymmdd'

    def __init__(self, name, path):
        """Set up the scraper for a single comic.

        name -- comic name; the scraper is registered as ``ComicSherpa/<name>``
        path -- value placed in the ``uc_comic`` URL parameter
        """
        scraper_name = 'ComicSherpa/' + name
        super().__init__(scraper_name)
        # NOTE(review): 1.0 and 2.0 are presumably the lower/upper delay
        # bounds in seconds -- confirm against session.add_throttle.
        self.session.add_throttle('www.comicssherpa.com', 1.0, 2.0)
        self.url = 'http://www.comicssherpa.com/site/feature?uc_comic=' + path

    def getIndexStripUrl(self, index):
        """Return this comic's URL with *index* as the ``uc_full_date`` value."""
        base_url = self.url
        date_param = '&uc_full_date=%s' % index
        return base_url + date_param

    @classmethod
    def getmodules(cls):  # noqa: Allowed to be long
        """Return a tuple holding one scraper instance per listed comic."""
        return (
            # do not edit anything below since these entries are generated from
            # scripts/comicsherpa.py
            # START AUTOUPDATE
            cls('060', 'csadl'),
            cls('AaronGuile', 'csdsf'),
            cls('ABCStreet', 'csmbx'),
            cls('ABitSketch', 'csxmy'),
            cls('ABomb', 'csvur'),
            cls('ACMEINKD', 'csmwt'),
            cls('AcornPark', 'csdfe'),
            cls('Adulting', 'cskky'),
            cls('AllInGoodTime', 'csjhr'),
            cls('AmandaTheGreat', 'cssyr'),
            cls('AndNow', 'csnxr'),
            cls('Anecdote', 'cspmf'),
            cls('AnimalMitchell', 'csdnm'),
            cls('AnneAndPythagoras', 'csokq'),
            cls('AppleCreekComics', 'cstgq'),
            cls('ATasteOfTimes', 'csprn'),
            cls('BatchRejection', 'csgny'),
            cls('Bazoobee', 'csfos'),
            cls('BeMisery', 'csiiq'),
            cls('BigJim', 'csiao'),
            cls('Bluebonnets', 'cston'),
            cls('BlueSkiesToons', 'csfoy'),
            cls('BobsYourUncle', 'csmxz'),
            cls('BoltsAndNuts', 'csnab'),
            cls('Bork', 'csczn'),
            cls('BottAuto', 'csmwz'),
            cls('BUNS', 'csbft'),
            cls('Bushscrubs', 'csmzx'),
            cls('CAFFEINATED', 'csbmv'),
            cls('CandacenCompany', 'csvpd'),
            cls('CarteBlanche', 'csnwk'),
            cls('CharmysArmy', 'cswrl'),
            cls('Complex', 'csusy'),
            cls('CourageousManAdventures', 'csgkn'),
            cls('DadsDay', 'cswly'),
            cls('DBCartoons', 'csnvt'),
            cls('DoghouseInYourSoul', 'cstwx'),
            cls('DoingTime', 'csvuk'),
            cls('DontPickTheFlowers', 'cswfs'),
            cls('Dragin', 'cswgz'),
            cls('DumbQuestionBadAnswer', 'cskro'),
            cls('DungeonHordes', 'csnlo'),
            cls('DustSpecks', 'csqgq'),
            cls('DutchnPals', 'cskqc'),
            cls('Econogirl', 'csxoj'),
            cls('EightballEyeball', 'csnfh'),
            cls('Elmo', 'csvff'),
            cls('Endangered', 'cshii'),
            cls('FamousAndNotSoFamousQuotes', 'csdgz'),
            cls('FarOut', 'csaem'),
            cls('FatherOfTheBrood', 'csuul'),
            cls('FoxTheCat', 'csxbc'),
            cls('FrankAndSteinway', 'cseui'),
            cls('FriedCritter', 'cshtp'),
            cls('GarciaCartoonCo', 'csyuw'),
            cls('GIRTH', 'csbjw'),
            cls('GrandmaSnoops', 'csscq'),
            cls('GrannyAnny', 'cskpg'),
            cls('GreenPieces', 'csnwy'),
            cls('GunstonStreet', 'csgru'),
            cls('HallEditorialCartoons', 'csgzx'),
            cls('HaphazardHumor', 'cspsa'),
            cls('Headcheese', 'cspku'),
            cls('Hogwashed', 'csbnf'),
            cls('HomeLife', 'csrbv'),
            cls('Hubbel', 'cszrr'),
            cls('HugoComics', 'csdwl'),
            cls('HurrieTheMisManager', 'cssri'),
            cls('HuskyTales', 'cslnp'),
            cls('InkwellForest', 'csmuk'),
            cls('IronyOr', 'csddz'),
            cls('ItsJustJim', 'cszos'),
            cls('JolleyStuffBrowser', 'csjpq'),
            cls('KALEECHIKORNERS', 'cshdw'),
            cls('KartoonsByKline', 'csoei'),
            cls('LaffToons', 'cssvj'),
            cls('LiliAndDerek', 'csvsy'),
            cls('LilleysSillies', 'cstka'),
            cls('LimboRoad', 'csfpp'),
            cls('LumAndAbner', 'cscji'),
            cls('MarysNature', 'csogt'),
            cls('Millennialville', 'csxrl'),
            cls('Milton50', 'csmof'),
            cls('Mindframe', 'csqnp'),
            cls('Minihahas', 'csoat'),
            cls('MiscSoup', 'csguq'),
            cls('MisterAndMe', 'csvhr'),
            cls('MockAll', 'csrds'),
            cls('Moments', 'csnso'),
            cls('Mongrels', 'csbjo'),
            cls('MortsIsland', 'csfyq'),
            cls('MySonIsADog', 'csfec'),
            cls('NoAmbiguity', 'csryw'),
            cls('NoBusinessIKnow', 'csmfg'),
            cls('NoOrdinaryLife', 'csicr'),
            cls('Npchumorcom', 'csbuv'),
            cls('OneFunnyGoldenRetriever', 'csnrf'),
            cls('ONIONAndPEA', 'cstsr'),
            cls('OscarAndAnnie', 'csczw'),
            cls('OverQuirked', 'cspes'),
            cls('PaddedCell', 'csxqk'),
            cls('Painterly', 'csuya'),
            cls('PalAndBuddy', 'csjut'),
            cls('PawsForThoughtComics', 'csced'),
            cls('Peeples', 'csnkd'),
            cls('PeopleOfEarth', 'csjqa'),
            cls('PicpakDog', 'cstmm'),
            cls('PirateMike', 'csxcb'),
            cls('PoliceLimit', 'cspcc'),
            cls('PoliticularJokesAndRuffus', 'csmvz'),
            cls('Prideland', 'csaoa'),
            cls('PrimusTheBadPhilosopher', 'csofd'),
            cls('ProfessorHerbertAndGEO', 'cscje'),
            cls('QueenBlackbeard', 'csecq'),
            cls('QuickDraw', 'csydp'),
            cls('RandysRationale', 'cshsw'),
            cls('Ringers', 'csxhx'),
            cls('RonWarren', 'csuwd'),
            cls('SandSharkBeach', 'cssqk'),
            cls('SharpCurveComics', 'csyek'),
            cls('SherpaAid', 'csvku'),
            cls('SignGarden', 'csbxu'),
            cls('SignsOfAFrustratedGolfer', 'csxdy'),
            cls('Skull', 'csdxo'),
            cls('Skylarking', 'csyac'),
            cls('SleepytownBeagles', 'cssbk'),
            cls('SmallNerdyCreatures', 'cshqb'),
            cls('Smith', 'csmdx'),
            cls('Snootle', 'cseic'),
            cls('SoccerDude', 'csnnb'),
            cls('SoccerEarth', 'csdma'),
            cls('SOD', 'cszdh'),
            cls('SomethingAboutCeleste', 'csgtv'),
            cls('SookyRottweiler', 'csegu'),
            cls('Spaceport51', 'csbyh'),
            cls('SportsByVoort', 'cskin'),
            cls('StaleCrackers', 'csngu'),
            cls('StankoAndTibor', 'csurl'),
            cls('Strangeville', 'cskps'),
            cls('SubSub', 'csvcv'),
            cls('SuburbanFairyTales', 'cscek'),
            cls('SUITSANDGUARDERS', 'cssag'),
            cls('SuperSiblings', 'csdxj'),
            cls('TheBeauforts', 'csfxu'),
            cls('TheBellies', 'csubt'),
            cls('TheBoobiehatch', 'csoev'),
            cls('TheCardinal', 'csfjg'),
            cls('TheDinkledorfs', 'cszhp'),
            cls('TheFabulousBushPigs', 'cscqi'),
            cls('TheGrayZone', 'csmue'),
            cls('TheGreenMonkeys', 'cscue'),
            cls('TheMagicForest', 'csjts'),
            cls('TheMothManAndLarvaeBoy', 'csycu'),
            cls('TheMountainMen', 'cskqw'),
            cls('TheNeighborhood', 'csrtu'),
            cls('TheNevilleYouKnow', 'csnov'),
            cls('TheNonsenseNewz', 'csghu'),
            cls('TheOldManAndHisDog', 'csudu'),
            cls('TheQuinnAndFinnShow', 'csynn'),
            cls('TheRocks', 'cswky'),
            cls('TheUnemployed', 'csanx'),
            cls('Thingsesque', 'cstsq'),
            cls('TodaysTrump', 'csbrj'),
            cls('TopicToons', 'csgly'),
            cls('ToughTown', 'csnjp'),
            cls('ToxicValues', 'csyig'),
            cls('TruthBeKnown', 'csfwi'),
            cls('TuesdaysWithCory', 'csiea'),
            cls('Underdone', 'csayl'),
            cls('UnMannerlyWays', 'csjmh'),
            cls('ViewFromTheCouch', 'csipm'),
            cls('VoicesInTheDark', 'csyou'),
            cls('WarpedAndDemented', 'csbgw'),
            cls('Waskataskahiskewaskewan', 'cssfg'),
            cls('WayOutComics', 'cstrs'),
            cls('WeaselInk', 'csfsn'),
            cls('WhiskeyFalls', 'csitw'),
            cls('Windsock', 'csywy'),
            cls('WrobbertCartoons', 'csupg'),
            cls('YinYangster', 'csteo'),
            cls('ZombieHeights', 'cswjq'),
            cls('Zootopia', 'csquz'),
            # END AUTOUPDATE
        )

View file

@ -629,71 +629,320 @@ class Removed(Scraper):
cls('ComicFury/TheUnthinkableHybrid'),
cls('ComicFury/TwentyFourSeven'),
cls('ComicFury/TwentyFourSevenFans'),
cls('ComicSherpa/060'),
cls('ComicSherpa/AaronGuile'),
cls('ComicSherpa/ABCStreet'),
cls('ComicSherpa/ABitSketch'),
cls('ComicSherpa/ABomb'),
cls('ComicSherpa/ACMEINKD'),
cls('ComicSherpa/AcornPark'),
cls('ComicSherpa/Adulting'),
cls('ComicSherpa/AllInGoodTime'),
cls('ComicSherpa/AmandaTheGreat'),
cls('ComicSherpa/AndNow'),
cls('ComicSherpa/Anecdote'),
cls('ComicSherpa/AnimalMitchell'),
cls('ComicSherpa/AnneAndPythagoras'),
cls('ComicSherpa/AppleCreekComics'),
cls('ComicSherpa/ATasteOfTimes'),
cls('ComicSherpa/BatchRejection'),
cls('ComicSherpa/Bazoobee'),
cls('ComicSherpa/BeMisery'),
cls('ComicSherpa/BigJim'),
cls('ComicSherpa/Bluebonnets'),
cls('ComicSherpa/BlueSkiesToons'),
cls('ComicSherpa/BobsYourUncle'),
cls('ComicSherpa/BoltsAndNuts'),
cls('ComicSherpa/Bork'),
cls('ComicSherpa/BottAuto'),
cls('ComicSherpa/BUNS'),
cls('ComicSherpa/Bushscrubs'),
cls('ComicSherpa/CAFFEINATED'),
cls('ComicSherpa/CandacenCompany'),
cls('ComicSherpa/CarteBlanche'),
cls('ComicSherpa/CharmysArmy'),
cls('ComicSherpa/Complex'),
cls('ComicSherpa/CourageousManAdventures'),
cls('ComicSherpa/DadsDay'),
cls('ComicSherpa/DBCartoons'),
cls('ComicSherpa/DoghouseInYourSoul'),
cls('ComicSherpa/DoingTime'),
cls('ComicSherpa/DontPickTheFlowers'),
cls('ComicSherpa/Dragin'),
cls('ComicSherpa/DumbQuestionBadAnswer'),
cls('ComicSherpa/DungeonHordes'),
cls('ComicSherpa/DustSpecks'),
cls('ComicSherpa/DutchnPals'),
cls('ComicSherpa/Econogirl'),
cls('ComicSherpa/EightballEyeball'),
cls('ComicSherpa/Elmo'),
cls('ComicSherpa/Endangered'),
cls('ComicSherpa/FamousAndNotSoFamousQuotes'),
cls('ComicSherpa/FarOut'),
cls('ComicSherpa/FatherOfTheBrood'),
cls('ComicSherpa/FoxTheCat'),
cls('ComicSherpa/FrankAndSteinway'),
cls('ComicSherpa/FriedCritter'),
cls('ComicSherpa/GarciaCartoonCo'),
cls('ComicSherpa/GIRTH'),
cls('ComicSherpa/GrandmaSnoops'),
cls('ComicSherpa/GrannyAnny'),
cls('ComicSherpa/GreenPieces'),
cls('ComicSherpa/GunstonStreet'),
cls('ComicSherpa/HallEditorialCartoons'),
cls('ComicSherpa/HaphazardHumor'),
cls('ComicSherpa/Headcheese'),
cls('ComicSherpa/Hogwashed'),
cls('ComicSherpa/HomeLife'),
cls('ComicSherpa/Hubbel'),
cls('ComicSherpa/HugoComics'),
cls('ComicSherpa/HurrieTheMisManager'),
cls('ComicSherpa/HuskyTales'),
cls('ComicSherpa/InkwellForest'),
cls('ComicSherpa/IronyOr'),
cls('ComicSherpa/ItsJustJim'),
cls('ComicSherpa/JolleyStuffBrowser'),
cls('ComicSherpa/KALEECHIKORNERS'),
cls('ComicSherpa/KartoonsByKline'),
cls('ComicSherpa/LaffToons'),
cls('ComicSherpa/LiliAndDerek'),
cls('ComicSherpa/LilleysSillies'),
cls('ComicSherpa/LimboRoad'),
cls('ComicSherpa/LumAndAbner'),
cls('ComicSherpa/MarysNature'),
cls('ComicSherpa/Millennialville'),
cls('ComicSherpa/Milton50'),
cls('ComicSherpa/Mindframe'),
cls('ComicSherpa/Minihahas'),
cls('ComicSherpa/MiscSoup'),
cls('ComicSherpa/MisterAndMe'),
cls('ComicSherpa/MockAll'),
cls('ComicSherpa/Moments'),
cls('ComicSherpa/Mongrels'),
cls('ComicSherpa/MortsIsland'),
cls('ComicSherpa/MySonIsADog'),
cls('ComicSherpa/NoAmbiguity'),
cls('ComicSherpa/NoBusinessIKnow'),
cls('ComicSherpa/NoOrdinaryLife'),
cls('ComicSherpa/Npchumorcom'),
cls('ComicSherpa/OneFunnyGoldenRetriever'),
cls('ComicSherpa/ONIONAndPEA'),
cls('ComicSherpa/OscarAndAnnie'),
cls('ComicSherpa/OverQuirked'),
cls('ComicSherpa/PaddedCell'),
cls('ComicSherpa/Painterly'),
cls('ComicSherpa/PalAndBuddy'),
cls('ComicSherpa/PawsForThoughtComics'),
cls('ComicSherpa/Peeples'),
cls('ComicSherpa/PeopleOfEarth'),
cls('ComicSherpa/PicpakDog'),
cls('ComicSherpa/PirateMike'),
cls('ComicSherpa/PoliceLimit'),
cls('ComicSherpa/PoliticularJokesAndRuffus'),
cls('ComicSherpa/Prideland'),
cls('ComicSherpa/PrimusTheBadPhilosopher'),
cls('ComicSherpa/ProfessorHerbertAndGEO'),
cls('ComicSherpa/QueenBlackbeard'),
cls('ComicSherpa/QuickDraw'),
cls('ComicSherpa/RandysRationale'),
cls('ComicSherpa/Ringers'),
cls('ComicSherpa/RonWarren'),
cls('ComicSherpa/SandSharkBeach'),
cls('ComicSherpa/SharpCurveComics'),
cls('ComicSherpa/SherpaAid'),
cls('ComicSherpa/SignGarden'),
cls('ComicSherpa/SignsOfAFrustratedGolfer'),
cls('ComicSherpa/Skull'),
cls('ComicSherpa/Skylarking'),
cls('ComicSherpa/SleepytownBeagles'),
cls('ComicSherpa/SmallNerdyCreatures'),
cls('ComicSherpa/Smith'),
cls('ComicSherpa/Snootle'),
cls('ComicSherpa/SoccerDude'),
cls('ComicSherpa/SoccerEarth'),
cls('ComicSherpa/SOD'),
cls('ComicSherpa/SomethingAboutCeleste'),
cls('ComicSherpa/SookyRottweiler'),
cls('ComicSherpa/Spaceport51'),
cls('ComicSherpa/SportsByVoort'),
cls('ComicSherpa/StaleCrackers'),
cls('ComicSherpa/StankoAndTibor'),
cls('ComicSherpa/Strangeville'),
cls('ComicSherpa/SubSub'),
cls('ComicSherpa/SuburbanFairyTales'),
cls('ComicSherpa/SUITSANDGUARDERS'),
cls('ComicSherpa/SuperSiblings'),
cls('ComicSherpa/TheBeauforts'),
cls('ComicSherpa/TheBellies'),
cls('ComicSherpa/TheBoobiehatch'),
cls('ComicSherpa/TheCardinal'),
cls('ComicSherpa/TheDinkledorfs'),
cls('ComicSherpa/TheFabulousBushPigs'),
cls('ComicSherpa/TheGrayZone'),
cls('ComicSherpa/TheGreenMonkeys'),
cls('ComicSherpa/TheMagicForest'),
cls('ComicSherpa/TheMothManAndLarvaeBoy'),
cls('ComicSherpa/TheMountainMen'),
cls('ComicSherpa/TheNeighborhood'),
cls('ComicSherpa/TheNevilleYouKnow'),
cls('ComicSherpa/TheNonsenseNewz'),
cls('ComicSherpa/TheOldManAndHisDog'),
cls('ComicSherpa/TheQuinnAndFinnShow'),
cls('ComicSherpa/TheRocks'),
cls('ComicSherpa/TheUnemployed'),
cls('ComicSherpa/Thingsesque'),
cls('ComicSherpa/TodaysTrump'),
cls('ComicSherpa/TopicToons'),
cls('ComicSherpa/ToughTown'),
cls('ComicSherpa/ToxicValues'),
cls('ComicSherpa/TruthBeKnown'),
cls('ComicSherpa/TuesdaysWithCory'),
cls('ComicSherpa/Underdone'),
cls('ComicSherpa/UnMannerlyWays'),
cls('ComicSherpa/ViewFromTheCouch'),
cls('ComicSherpa/VoicesInTheDark'),
cls('ComicSherpa/WarpedAndDemented'),
cls('ComicSherpa/Waskataskahiskewaskewan'),
cls('ComicSherpa/WayOutComics'),
cls('ComicSherpa/WeaselInk'),
cls('ComicSherpa/WhiskeyFalls'),
cls('ComicSherpa/Windsock'),
cls('ComicSherpa/WrobbertCartoons'),
cls('ComicSherpa/YinYangster'),
cls('ComicSherpa/ZombieHeights'),
cls('ComicSherpa/Zootopia'),
cls('GoComics/060'),
cls('GoComics/2CowsAndAChicken'),
cls('GoComics/ABitSketch'),
cls('GoComics/Andnow'),
cls('GoComics/Anecdote'),
cls('GoComics/AppleCreekComics'),
cls('GoComics/AskAPortlySyndicatePerson'),
cls('GoComics/BarkingCrayon'),
cls('GoComics/Bazoobee'),
cls('GoComics/Bewley'),
cls('GoComics/Biographic'),
cls('GoComics/Bluebonnets'),
cls('GoComics/BlueSkiesToons'),
cls('GoComics/BottAuto'),
cls('GoComics/BrainSquirts'),
cls('GoComics/BUNS'),
cls('GoComics/CAFFEINATED'),
cls('GoComics/CapsulasMedicas'),
cls('GoComics/CharmysArmy'),
cls('GoComics/ClearBlueWater'),
cls('GoComics/Committed'),
cls('GoComics/ConnieToTheWonnie'),
cls('GoComics/CourageousManAdventures'),
cls('GoComics/DontPicktheFlowers'),
cls('GoComics/DorrisMcComics'),
cls('GoComics/Dragin'),
cls('GoComics/DragonGirl'),
cls('GoComics/Drive'),
cls('GoComics/DudeAndDude'),
cls('GoComics/DumbQuestionBadAnswer'),
cls('GoComics/DustSpecks'),
cls('GoComics/Econogirl'),
cls('GoComics/EdgeOfAdventure'),
cls('GoComics/Elmo'),
cls('GoComics/EricTheCircle'),
cls('GoComics/FacesOfTheNewsByKerryWaghorn'),
cls('GoComics/FarOut'),
cls('GoComics/FortKnox'),
cls('GoComics/FrankAndSteinway'),
cls('GoComics/FriedCritter'),
cls('GoComics/GarciaCartoonCo'),
cls('GoComics/GarfieldMinusGarfield'),
cls('GoComics/GIRTH'),
cls('GoComics/GoComicsFanArt'),
cls('GoComics/Graffiti'),
cls('GoComics/GrannyAnny'),
cls('GoComics/GreenPieces'),
cls('GoComics/GunstonStreet'),
cls('GoComics/HaikuEwe'),
cls('GoComics/Headcheese'),
cls('GoComics/HealthCapsules'),
cls('GoComics/HowToCat'),
cls('GoComics/HumanCull'),
cls('GoComics/ItsjustJim'),
cls('GoComics/JerryHolbert'),
cls('GoComics/JillpokeBohemia'),
cls('GoComics/JustSayUncle'),
cls('GoComics/KartoonsByKline'),
cls('GoComics/KidSpot'),
cls('GoComics/KidTown'),
cls('GoComics/KitNCarlyle'),
cls('GoComics/LostSideOfSuburbia'),
cls('GoComics/LumandAbner'),
cls('GoComics/MagicInAMinute'),
cls('GoComics/MazeToonsPuzzle'),
cls('GoComics/MegClassics'),
cls('GoComics/MichaelAndrew'),
cls('GoComics/Microcosm'),
cls('GoComics/Millennialville'),
cls('GoComics/Milton50'),
cls('GoComics/Mindframe'),
cls('GoComics/MiscSoup'),
cls('GoComics/MisterAndMe'),
cls('GoComics/MortsIsland'),
cls('GoComics/MyCage'),
cls('GoComics/MyCageNewAndOld'),
cls('GoComics/NoOrdinaryLife'),
cls('GoComics/ONIONAndPEA'),
cls('GoComics/PaddedCell'),
cls('GoComics/PaulSzep'),
cls('GoComics/Peeples'),
cls('GoComics/PicturesInBoxes'),
cls('GoComics/PieComic'),
cls('GoComics/Pinkerton'),
cls('GoComics/PoliceLimit'),
cls('GoComics/PopCultureShockTherapy'),
cls('GoComics/ReplyAll'),
cls('GoComics/ReplyAllLite'),
cls('GoComics/RonWarren'),
cls('GoComics/Sheldon'),
cls('GoComics/Shoecabbage'),
cls('GoComics/Shortcuts'),
cls('GoComics/ShutterbugFollies'),
cls('GoComics/SignGarden'),
cls('GoComics/SleepytownBeagles'),
cls('GoComics/SmallNerdyCreatures'),
cls('GoComics/Smith'),
cls('GoComics/SoccerEarth'),
cls('GoComics/SookyRottweiler'),
cls('GoComics/Speechless'),
cls('GoComics/SportsbyVoort'),
cls('GoComics/StankoAndTibor'),
cls('GoComics/SubSub'),
cls('GoComics/SuburbanFairyTales'),
cls('GoComics/SuperSiblings'),
cls('GoComics/ThatsLife'),
cls('GoComics/TheBeauforts'),
cls('GoComics/TheBentPinky'),
cls('GoComics/TheBestMedicineCartoon'),
cls('GoComics/TheBoobiehatch'),
cls('GoComics/TheCardinal'),
cls('GoComics/TheConjurers'),
cls('GoComics/TheCreeps'),
cls('GoComics/TheGentlemansArmchair'),
cls('GoComics/TheGreenMonkeys'),
cls('GoComics/TheLostBear'),
cls('GoComics/TheNorm40'),
cls('GoComics/TheOldManAndHisDog'),
cls('GoComics/TheQuinnAndFinnShow'),
cls('GoComics/TheQuixoteSyndrome'),
cls('GoComics/TheSunshineClub'),
cls('GoComics/Thingsesque'),
cls('GoComics/TimEagan'),
cls('GoComics/TOBY'),
cls('GoComics/UncleArtsFunland'),
cls('GoComics/USAcres'),
cls('GoComics/WayOutComics'),
cls('GoComics/WhiskeyFalls'),
cls('GoComics/WhyattCartoons'),
cls('GoComics/WorldOfWonder'),
cls('GoComics/Wrobbertcartoons'),
cls('GoComics/Zootopia'),
cls('JustAnotherEscape'),
cls('Laiyu', 'brk'),
cls('MangaDex/DrStone', 'legal'),
@ -1314,73 +1563,6 @@ class Renamed(Scraper):
cls('DarkWings', 'Eryl'),
cls('EyeOfRamalach', 'KemonoCafe/TheEyeOfRamalach'),
cls('FoulLanguage', 'GoComics/FowlLanguage'),
cls('GoComics/060', 'ComicSherpa/060'),
cls('GoComics/ABitSketch', 'ComicSherpa/ABitSketch'),
cls('GoComics/Andnow', 'ComicSherpa/AndNow'),
cls('GoComics/Anecdote', 'ComicSherpa/Anecdote'),
cls('GoComics/AppleCreekComics', 'ComicSherpa/AppleCreekComics'),
cls('GoComics/BarkingCrayon', 'ComicFury/BarkingCrayon'),
cls('GoComics/Bazoobee', 'ComicSherpa/Bazoobee'),
cls('GoComics/Bluebonnets', 'ComicSherpa/Bluebonnets'),
cls('GoComics/BlueSkiesToons', 'ComicSherpa/BlueSkiesToons'),
cls('GoComics/BottAuto', 'ComicSherpa/BottAuto'),
cls('GoComics/BUNS', 'ComicSherpa/BUNS'),
cls('GoComics/CAFFEINATED', 'ComicSherpa/CAFFEINATED'),
cls('GoComics/CharmysArmy', 'ComicSherpa/CharmysArmy'),
cls('GoComics/CourageousManAdventures', 'ComicSherpa/CourageousManAdventures'),
cls('GoComics/DontPicktheFlowers', 'ComicSherpa/DontPickTheFlowers'),
cls('GoComics/Dragin', 'ComicSherpa/Dragin'),
cls('GoComics/DumbQuestionBadAnswer', 'ComicSherpa/DumbQuestionBadAnswer'),
cls('GoComics/DustSpecks', 'ComicSherpa/DustSpecks'),
cls('GoComics/Econogirl', 'ComicSherpa/Econogirl'),
cls('GoComics/Elmo', 'ComicSherpa/Elmo'),
cls('GoComics/FarOut', 'ComicSherpa/FarOut'),
cls('GoComics/FrankAndSteinway', 'ComicSherpa/FrankAndSteinway'),
cls('GoComics/FriedCritter', 'ComicSherpa/FriedCritter'),
cls('GoComics/GarciaCartoonCo', 'ComicSherpa/GarciaCartoonCo'),
cls('GoComics/GIRTH', 'ComicSherpa/GIRTH'),
cls('GoComics/GrannyAnny', 'ComicSherpa/GrannyAnny'),
cls('GoComics/GreenPieces', 'ComicSherpa/GreenPieces'),
cls('GoComics/GunstonStreet', 'ComicSherpa/GunstonStreet'),
cls('GoComics/Headcheese', 'ComicSherpa/Headcheese'),
cls('GoComics/ItsjustJim', 'ComicSherpa/ItsJustJim'),
cls('GoComics/JillpokeBohemia', 'ComicFury/JillpokeBohemia'),
cls('GoComics/KartoonsByKline', 'ComicSherpa/KartoonsByKline'),
cls('GoComics/LumandAbner', 'ComicSherpa/LumAndAbner'),
cls('GoComics/Millennialville', 'ComicSherpa/Millennialville'),
cls('GoComics/Milton50', 'ComicSherpa/Milton50'),
cls('GoComics/Mindframe', 'ComicSherpa/Mindframe'),
cls('GoComics/MiscSoup', 'ComicSherpa/MiscSoup'),
cls('GoComics/MisterAndMe', 'ComicSherpa/MisterAndMe'),
cls('GoComics/MortsIsland', 'ComicSherpa/MortsIsland'),
cls('GoComics/NoOrdinaryLife', 'ComicSherpa/NoOrdinaryLife'),
cls('GoComics/ONIONAndPEA', 'ComicSherpa/ONIONAndPEA'),
cls('GoComics/PaddedCell', 'ComicSherpa/PaddedCell'),
cls('GoComics/Peeples', 'ComicSherpa/Peeples'),
cls('GoComics/PoliceLimit', 'ComicSherpa/PoliceLimit'),
cls('GoComics/RonWarren', 'ComicSherpa/RonWarren'),
cls('GoComics/SignGarden', 'ComicSherpa/SignGarden'),
cls('GoComics/SleepytownBeagles', 'ComicSherpa/SleepytownBeagles'),
cls('GoComics/SmallNerdyCreatures', 'ComicSherpa/SmallNerdyCreatures'),
cls('GoComics/Smith', 'ComicSherpa/Smith'),
cls('GoComics/SoccerEarth', 'ComicSherpa/SoccerEarth'),
cls('GoComics/SookyRottweiler', 'ComicSherpa/SookyRottweiler'),
cls('GoComics/SportsbyVoort', 'ComicSherpa/SportsByVoort'),
cls('GoComics/StankoAndTibor', 'ComicSherpa/StankoAndTibor'),
cls('GoComics/SubSub', 'ComicSherpa/SubSub'),
cls('GoComics/SuburbanFairyTales', 'ComicSherpa/SuburbanFairyTales'),
cls('GoComics/SuperSiblings', 'ComicSherpa/SuperSiblings'),
cls('GoComics/TheBeauforts', 'ComicSherpa/TheBeauforts'),
cls('GoComics/TheBoobiehatch', 'ComicSherpa/TheBoobiehatch'),
cls('GoComics/TheCardinal', 'ComicSherpa/TheCardinal'),
cls('GoComics/TheGreenMonkeys', 'ComicSherpa/TheGreenMonkeys'),
cls('GoComics/TheOldManAndHisDog', 'ComicSherpa/TheOldManAndHisDog'),
cls('GoComics/TheQuinnAndFinnShow', 'ComicSherpa/TheQuinnAndFinnShow'),
cls('GoComics/Thingsesque', 'ComicSherpa/Thingsesque'),
cls('GoComics/WayOutComics', 'ComicSherpa/WayOutComics'),
cls('GoComics/WhiskeyFalls', 'ComicSherpa/WhiskeyFalls'),
cls('GoComics/Wrobbertcartoons', 'ComicSherpa/WrobbertCartoons'),
cls('GoComics/Zootopia', 'ComicSherpa/Zootopia'),
cls('KeenSpot/AntiheroForHire', 'AntiheroForHire'),
cls('KeenSpot/ElGoonishShive', 'ElGoonishShive'),
cls('KeenSpot/ElGoonishShiveNP', 'ElGoonishShiveNP'),

View file

@ -1,44 +0,0 @@
#!/usr/bin/env python3
# SPDX-License-Identifier: MIT
# Copyright (C) 2004-2008 Tristan Seligmann and Jonathan Jacobs
# Copyright (C) 2012-2014 Bastian Kleineidam
# Copyright (C) 2015-2017 Tobias Gruetzmacher
"""
Script to get a list of ComicSherpa comics and save the info in a JSON file for
further processing.
"""
from scriptutil import ComicListUpdater
class ComicSherpaUpdater(ComicListUpdater):
    """Collect the comics linked from the ComicSherpa home page."""

    # names of comics to exclude
    # NOTE(review): presumably evaluated by ComicListUpdater -- this class
    # never reads the tuple itself.
    excluded_comics = (
        # missing images
        'Pi',
        'Rufus',
        # too short
        'BeneathTheFerns',
        'BillyAndCo',
        'BuffaloChips',
        'Crawdiddy',
        'Gravy',
        'NewFeature',
    )

    def collect_results(self):
        """Parse all listing pages.

        Every link on the home page whose ``href`` contains "site/feature"
        is registered through ``add_comic`` with the link text as name and
        the value of the link's first query parameter as comic code. Links
        that lack either piece of information are skipped.
        """
        data = self.get_url('http://www.comicssherpa.com/site/home.html', expand=False)
        for comiclink in data.xpath('//a[contains(@href, "site/feature")]'):
            name = comiclink.text
            href = comiclink.attrib['href']
            # Keep only the first parameter's value: everything after the
            # first '=' up to the next '&'. A plain split('=')[1] raised
            # IndexError for hrefs without '=' and leaked the name of the
            # following parameter into the code for multi-parameter hrefs.
            link = href.partition('=')[2].split('&', 1)[0]
            # NOTE(review): assumes lxml-style elements, where ``text`` is
            # None for a link without leading text (e.g. one wrapping only
            # an image); such a link provides no usable comic name.
            if name is None or not link:
                continue
            self.add_comic(name, link)

    def get_entry(self, name, url):
        """Return the ``cls(...)`` source line for one comic.

        name -- scraper name of the comic
        url -- comic code as collected by ``collect_results``
        """
        return "cls('%s', '%s')," % (name, url)
# Script entry point: build the updater for this file and run it.
if __name__ == '__main__':
    updater = ComicSherpaUpdater(__file__)
    updater.run()