Merge pull request #254 from Southparkfan/master

Add Miraheze wiki farm
pull/262/head
nemobis 9 years ago
commit b2d3239027

@ -0,0 +1,34 @@
#!/usr/bin/env python2
# -*- coding: utf-8 -*-
# Copyright (C) 2014 WikiTeam developers
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
import re
import requests
def main():
    """Print the api.php URL of every wiki listed on Miraheze's SiteMatrix.

    Downloads https://meta.miraheze.org/wiki/Special:SiteMatrix, extracts the
    host name from every table row that links to a wiki, and writes one
    ``https://<host>/w/api.php`` line per wiki to standard output.

    Raises:
        requests.exceptions.RequestException: if the page cannot be fetched,
            the request times out, or the server answers with an HTTP error
            status.
    """
    headers = {
        'User-Agent': 'Mozilla/5.0 (X11; Linux i686; rv:24.0) Gecko/20100101 Firefox/24.0',
    }
    url = 'https://meta.miraheze.org/wiki/Special:SiteMatrix'

    # Without a timeout requests waits forever on a stalled connection.
    r = requests.get(url, headers=headers, timeout=60)
    # Fail loudly on 4xx/5xx instead of scraping an error page and silently
    # emitting an empty list.
    r.raise_for_status()
    raw = r.text

    # A plain raw string is used because the ur'' prefix is Python 2 only;
    # the pattern is pure ASCII, so it still matches unicode text on Python 2.
    hosts = re.findall(r'<tr><td><a href="https://([^>]+?)/">[^<]+</a></td></tr>', raw)
    for host in hosts:
        # A single parenthesised argument prints identically whether print is
        # a statement (Python 2) or a function (Python 3).
        print('https://' + host + '/w/api.php')


if __name__ == '__main__':
    main()

@ -0,0 +1,53 @@
https://8station.miraheze.org/w/api.php
https://advancedazrielangel.miraheze.org/w/api.php
https://allthetropes.miraheze.org/w/api.php
https://allthetropestest.miraheze.org/w/api.php
https://antiguabarbudacalypso.com/w/api.php
https://anuwiki.com/w/api.php
https://bitcoindebates.miraheze.org/w/api.php
https://bus.miraheze.org/w/api.php
https://camerainfo.miraheze.org/w/api.php
https://castironcook.miraheze.org/w/api.php
https://catbox.miraheze.org/w/api.php
https://civicv.miraheze.org/w/api.php
https://clicordi.miraheze.org/w/api.php
https://creed.miraheze.org/w/api.php
https://creersonarbre.miraheze.org/w/api.php
https://degu.miraheze.org/w/api.php
https://dp.miraheze.org/w/api.php
https://drunkenpeasants.miraheze.org/w/api.php
https://fieldresearch.miraheze.org/w/api.php
https://gen.miraheze.org/w/api.php
https://gibs.miraheze.org/w/api.php
https://gumedien.miraheze.org/w/api.php
https://imedrones.miraheze.org/w/api.php
https://interwiki.miraheze.org/w/api.php
https://izanagi.miraheze.org/w/api.php
https://jumpingjimny.miraheze.org/w/api.php
https://lastpodcast.miraheze.org/w/api.php
https://linux.miraheze.org/w/api.php
https://login.miraheze.org/w/api.php
https://mafia.miraheze.org/w/api.php
https://meta.miraheze.org/w/api.php
https://micropedia.miraheze.org/w/api.php
https://mot94.miraheze.org/w/api.php
https://permanentfuturelab.wiki/w/api.php
https://poserdazfreebies.miraheze.org/w/api.php
https://printmakingbe.miraheze.org/w/api.php
https://pxgproject.miraheze.org/w/api.php
https://quantix.miraheze.org/w/api.php
https://rawdata.miraheze.org/w/api.php
https://recherchesdocumentaires.miraheze.org/w/api.php
https://safiria.miraheze.org/w/api.php
https://southparkfan.miraheze.org/w/api.php
https://spiral.wiki/w/api.php
https://spiraltest.miraheze.org/w/api.php
https://tanods.miraheze.org/w/api.php
https://test.miraheze.org/w/api.php
https://theestablishmentmap.miraheze.org/w/api.php
https://tyrolmountains.miraheze.org/w/api.php
https://undisconnect.miraheze.org/w/api.php
https://unna.miraheze.org/w/api.php
https://welcomewiki.miraheze.org/w/api.php
https://wikiolimpica.miraheze.org/w/api.php
https://witsacademy.miraheze.org/w/api.php

@ -0,0 +1,8 @@
Wikifarm: https://meta.miraheze.org/wiki/Miraheze
Last update: 2015-09-29
Details:
There is a dynamic list at https://meta.miraheze.org/wiki/Special:SiteMatrix
Run script: python2 miraheze-spider.py > newlist
Loading…
Cancel
Save