mirror of
https://github.com/WikiTeam/wikiteam
synced 2024-11-15 00:15:00 +00:00
Adding a spider for wikkii, updating the list (10 different wikis: 2 new, 8 dead), and adding info for the list
This commit is contained in:
parent
c7fc194f0d
commit
c420d4d843
37
listsofwikis/wikkii-spider.py
Normal file
37
listsofwikis/wikkii-spider.py
Normal file
@ -0,0 +1,37 @@
|
|||||||
|
#!/usr/bin/env python2
|
||||||
|
# -*- coding: utf-8 -*-
|
||||||
|
|
||||||
|
# Copyright (C) 2014 WikiTeam developers
|
||||||
|
# This program is free software: you can redistribute it and/or modify
|
||||||
|
# it under the terms of the GNU General Public License as published by
|
||||||
|
# the Free Software Foundation, either version 3 of the License, or
|
||||||
|
# (at your option) any later version.
|
||||||
|
#
|
||||||
|
# This program is distributed in the hope that it will be useful,
|
||||||
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
# GNU General Public License for more details.
|
||||||
|
#
|
||||||
|
# You should have received a copy of the GNU General Public License
|
||||||
|
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
|
||||||
|
import json
|
||||||
|
import random
|
||||||
|
import re
|
||||||
|
import requests
|
||||||
|
import time
|
||||||
|
|
||||||
|
def main():
    """Fetch the wikkii farm listing page and print every wiki URL found.

    Downloads http://wikkii.com/wiki/Special:Farmer/list with a browser-like
    User-Agent, extracts the ``href`` of each ``<dt> <a ... class="extiw"``
    anchor, and prints one URL per line to standard output.

    Raises:
        requests.exceptions.RequestException: if the request fails, times
            out, or the server answers with an HTTP error status.
    """
    headers = {
        'User-Agent': 'Mozilla/5.0 (X11; Linux i686; rv:24.0) Gecko/20100101 Firefox/24.0',
    }

    url = 'http://wikkii.com/wiki/Special:Farmer/list'
    # A timeout keeps the spider from hanging forever on an unresponsive farm.
    r = requests.get(url, headers=headers, timeout=30)
    # Fail loudly on 4xx/5xx instead of silently printing an empty list.
    r.raise_for_status()
    raw = r.text

    # Plain raw string (not ur'...') so the pattern is valid on both
    # Python 2 and Python 3; it still matches against the unicode body.
    m = re.findall(r'<dt> <a href="([^>]+?)" class="extiw"', raw)
    for i in m:
        # Parenthesised single-argument print behaves the same on 2 and 3.
        print(i)
|
||||||
|
|
||||||
|
# Run the spider only when this file is executed as a script, not on import.
if __name__ == '__main__':
    main()
|
@ -52,7 +52,6 @@ http://actabe.wikkii.com
|
|||||||
http://activatumente.wikkii.com
|
http://activatumente.wikkii.com
|
||||||
http://acuvueoasys.wikkii.com
|
http://acuvueoasys.wikkii.com
|
||||||
http://ac.wikkii.com
|
http://ac.wikkii.com
|
||||||
http://ac.wikkii.net
|
|
||||||
http://acworld.wikkii.com
|
http://acworld.wikkii.com
|
||||||
http://addward.wikkii.com
|
http://addward.wikkii.com
|
||||||
http://adivo.wikkii.com
|
http://adivo.wikkii.com
|
||||||
@ -610,7 +609,6 @@ http://ctaahr.wikkii.com
|
|||||||
http://ctcgroupproject.wikkii.com
|
http://ctcgroupproject.wikkii.com
|
||||||
http://cuarento.wikkii.com
|
http://cuarento.wikkii.com
|
||||||
http://cubicopedia.wikkii.com
|
http://cubicopedia.wikkii.com
|
||||||
http://cubipedia.wikkii.com
|
|
||||||
http://cuppedia.wikkii.com
|
http://cuppedia.wikkii.com
|
||||||
http://cure.wikkii.com
|
http://cure.wikkii.com
|
||||||
http://curiosityshop.wikkii.com
|
http://curiosityshop.wikkii.com
|
||||||
@ -1110,7 +1108,6 @@ http://gigipedia.wikkii.com
|
|||||||
http://gijinka.wikkii.com
|
http://gijinka.wikkii.com
|
||||||
http://gikopedia.wikkii.com
|
http://gikopedia.wikkii.com
|
||||||
http://gintama.wikkii.com
|
http://gintama.wikkii.com
|
||||||
http://gintama.wikkii.net
|
|
||||||
http://gknova6wiki.wikkii.com
|
http://gknova6wiki.wikkii.com
|
||||||
http://gkwiki.wikkii.com
|
http://gkwiki.wikkii.com
|
||||||
http://glacierwolf.wikkii.com
|
http://glacierwolf.wikkii.com
|
||||||
@ -1167,6 +1164,7 @@ http://gruposlcc.wikkii.com
|
|||||||
http://gsdiam.wikkii.com
|
http://gsdiam.wikkii.com
|
||||||
http://gsuphilosophy.wikkii.com
|
http://gsuphilosophy.wikkii.com
|
||||||
http://gs.wikkii.com
|
http://gs.wikkii.com
|
||||||
|
http://gta.wikkii.com
|
||||||
http://gtmdms.wikkii.com
|
http://gtmdms.wikkii.com
|
||||||
http://gudrapdija.wikkii.com
|
http://gudrapdija.wikkii.com
|
||||||
http://gudrapedia.wikkii.com
|
http://gudrapedia.wikkii.com
|
||||||
@ -1302,7 +1300,6 @@ http://iatr.wikkii.com
|
|||||||
http://iatw.wikkii.com
|
http://iatw.wikkii.com
|
||||||
http://ibizahotel.wikkii.com
|
http://ibizahotel.wikkii.com
|
||||||
http://iceclimber.wikkii.com
|
http://iceclimber.wikkii.com
|
||||||
http://icehockey.wikkii.com
|
|
||||||
http://iceman311.wikkii.com
|
http://iceman311.wikkii.com
|
||||||
http://icewedge.wikkii.com
|
http://icewedge.wikkii.com
|
||||||
http://ichatroom.wikkii.com
|
http://ichatroom.wikkii.com
|
||||||
@ -1464,7 +1461,6 @@ http://kacperix.wikkii.com
|
|||||||
http://kaidan.wikkii.com
|
http://kaidan.wikkii.com
|
||||||
http://kainon.wikkii.com
|
http://kainon.wikkii.com
|
||||||
http://kaktopedia.wikkii.com
|
http://kaktopedia.wikkii.com
|
||||||
http://kala.wikkii.com
|
|
||||||
http://kaleidos.wikkii.com
|
http://kaleidos.wikkii.com
|
||||||
http://kangaroophysics.wikkii.com
|
http://kangaroophysics.wikkii.com
|
||||||
http://kanithoshigh.wikkii.com
|
http://kanithoshigh.wikkii.com
|
||||||
@ -2021,7 +2017,6 @@ http://omwarch.wikkii.com
|
|||||||
http://oncechosendev.wikkii.com
|
http://oncechosendev.wikkii.com
|
||||||
http://onepiecewiki.wikkii.com
|
http://onepiecewiki.wikkii.com
|
||||||
http://onepiece.wikkii.com
|
http://onepiece.wikkii.com
|
||||||
http://onepiece.wikkii.net
|
|
||||||
http://oneshotrpg.wikkii.com
|
http://oneshotrpg.wikkii.com
|
||||||
http://onfan.wikkii.com
|
http://onfan.wikkii.com
|
||||||
http://onionleaks.wikkii.com
|
http://onionleaks.wikkii.com
|
||||||
@ -2335,7 +2330,6 @@ http://recette.wikkii.com
|
|||||||
http://reduction12.wikkii.com
|
http://reduction12.wikkii.com
|
||||||
http://redzero.wikkii.com
|
http://redzero.wikkii.com
|
||||||
http://regularshow.wikkii.com
|
http://regularshow.wikkii.com
|
||||||
http://rejuveverse.wikkii.com
|
|
||||||
http://remnantknights.wikkii.com
|
http://remnantknights.wikkii.com
|
||||||
http://rengine.wikkii.com
|
http://rengine.wikkii.com
|
||||||
http://reno.wikkii.com
|
http://reno.wikkii.com
|
||||||
@ -2607,7 +2601,6 @@ http://sr50.wikkii.com
|
|||||||
http://sraven.wikkii.com
|
http://sraven.wikkii.com
|
||||||
http://sroinfo.wikkii.com
|
http://sroinfo.wikkii.com
|
||||||
http://srtolkien.wikkii.com
|
http://srtolkien.wikkii.com
|
||||||
http://sr.wikkii.com
|
|
||||||
http://ssklearningcentre.wikkii.com
|
http://ssklearningcentre.wikkii.com
|
||||||
http://ssr.wikkii.com
|
http://ssr.wikkii.com
|
||||||
http://staffchristmas.wikkii.com
|
http://staffchristmas.wikkii.com
|
||||||
@ -2618,6 +2611,7 @@ http://stargatefanon.wikkii.com
|
|||||||
http://stargate.wikkii.com
|
http://stargate.wikkii.com
|
||||||
http://starjunky.wikkii.com
|
http://starjunky.wikkii.com
|
||||||
http://starship.wikkii.com
|
http://starship.wikkii.com
|
||||||
|
http://starsreach.wikkii.com
|
||||||
http://stasikosarticles.wikkii.com
|
http://stasikosarticles.wikkii.com
|
||||||
http://statnice.wikkii.com
|
http://statnice.wikkii.com
|
||||||
http://stavba.wikkii.com
|
http://stavba.wikkii.com
|
||||||
|
@ -1,4 +1,7 @@
|
|||||||
Wikifarm: http://wikkii.com/wiki/Free_Wiki_Hosting
|
Wikifarm: http://wikkii.com/wiki/Free_Wiki_Hosting
|
||||||
Last update: unknown
|
Last update: 2014-06-27
|
||||||
|
|
||||||
Details:
|
Details:
|
||||||
|
|
||||||
|
Dynamic list: http://wikkii.com/wiki/Special:Farmer/list
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user