Revision: 7070
Author: alexsh
Date: 2009-07-15 21:02:49 +0000 (Wed, 15 Jul 2009)
Log Message:
-----------
site().linksearch: make detection of JSON data pages more efficient
Modified Paths:
--------------
trunk/pywikipedia/wikipedia.py
Modified: trunk/pywikipedia/wikipedia.py
===================================================================
--- trunk/pywikipedia/wikipedia.py 2009-07-15 20:43:32 UTC (rev 7069)
+++ trunk/pywikipedia/wikipedia.py 2009-07-15 21:02:49 UTC (rev 7070)
@@ -5829,13 +5829,8 @@
if data['query']['exturlusage'] == []:
break
- if data.has_key(u'query-continue'):
- params['euoffset'] = data[u'query-continue'][u'exturlusage'][u'euoffset']
- else:
- keepGo = False
- data = data['query']['exturlusage']
- for pages in data:
+ for pages in data['query']['exturlusage']:
if not siteurl in pages['title']:
# the links themselves have similar form
if pages['title'] in cache:
@@ -5843,6 +5838,10 @@
else:
cache.append(pages['title'])
yield Page(self, pages['title'])
+ if data.has_key(u'query-continue'):
+ params['euoffset'] = data[u'query-continue'][u'exturlusage'][u'euoffset']
+ else:
+ break
else:
output(u'Querying [[Special:Linksearch]]...')
for url in urlsToRetrieve:
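
For reference, a minimal sketch of the pagination pattern this revision settles on (fetch_json is a hypothetical stand-in for query.GetData, not pywikipedia code): yield the current batch first, then follow 'query-continue', and break when the API returns no further euoffset.

    def iter_exturlusage(fetch_json, url, limit=500):
        params = {
            'action': 'query',
            'list': 'exturlusage',
            'eulimit': limit,
            'euquery': url,
        }
        while True:
            data = fetch_json(params)
            if not data['query']['exturlusage']:
                break
            for page in data['query']['exturlusage']:
                yield page['title']
            # Advance the offset only after the batch has been yielded; the
            # pre-fix code read 'query-continue' before processing results.
            if 'query-continue' in data:
                params['euoffset'] = data['query-continue']['exturlusage']['euoffset']
            else:
                break
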
Revision: 7068
Author: alexsh
Date: 2009-07-15 20:23:26 +0000 (Wed, 15 Jul 2009)
Log Message:
-----------
site().linksearch: add API method (took 2 hours to debug... Orz)
Modified Paths:
--------------
trunk/pywikipedia/wikipedia.py
Modified: trunk/pywikipedia/wikipedia.py
===================================================================
--- trunk/pywikipedia/wikipedia.py 2009-07-15 19:25:32 UTC (rev 7067)
+++ trunk/pywikipedia/wikipedia.py 2009-07-15 20:23:26 UTC (rev 7068)
@@ -5808,44 +5808,74 @@
def linksearch(self, siteurl, limit=500):
"""Yield Pages from results of Special:Linksearch for 'siteurl'."""
- output(u'Querying [[Special:Linksearch]]...')
cache = []
R = re.compile('title ?=\"([^<>]*?)\">[^<>]*</a></li>')
urlsToRetrieve = [siteurl]
if not siteurl.startswith('*.'):
urlsToRetrieve.append('*.' + siteurl)
- for url in urlsToRetrieve:
- offset = 0
- while True:
- path = self.linksearch_address(url, limit=limit, offset=offset)
- get_throttle()
- html = self.getUrl(path)
- #restricting the HTML source :
- #when in the source, this div marks the beginning of the input
- loc = html.find('<div class="mw-spcontent">')
- if loc > -1:
- html = html[loc:]
- #when in the source, marks the end of the linklist
- loc = html.find('<div class="printfooter">')
- if loc > -1:
- html = html[:loc]
+ if config.use_api:
+ output(u'Querying API...')
+ for url in urlsToRetrieve:
+ params = {
+ 'action': 'query',
+ 'list' : 'exturlusage',
+ 'eulimit': limit,
+ 'euquery': url,
+ }
+ keepGo = True
+ while keepGo:
+ data = query.GetData(params, useAPI = True)
+ if data['query']['exturlusage'] == []:
+ break
+
+ if data.has_key(u'query-continue'):
+ params['euoffset'] = data[u'query-continue'][u'exturlusage'][u'euoffset']
+ else:
+ keepGo = False
- #our regex fetches internal page links and the link they contain
- links = R.findall(html)
- if not links:
- #no more page to be fetched for that link
- break
- for title in links:
- if not siteurl in title:
- # the links themselves have similar form
- if title in cache:
- continue
- else:
- cache.append(title)
- yield Page(self, title)
- offset += limit
+ data = data['query']['exturlusage']
+ for pages in data:
+ if not siteurl in pages['title']:
+ # the links themselves have similar form
+ if pages['title'] in cache:
+ continue
+ else:
+ cache.append(pages['title'])
+ yield Page(self, pages['title'])
+ else:
+ output(u'Querying [[Special:Linksearch]]...')
+ for url in urlsToRetrieve:
+ offset = 0
+ while True:
+ path = self.linksearch_address(url, limit=limit, offset=offset)
+ get_throttle()
+ html = self.getUrl(path)
+ #restricting the HTML source :
+ #when in the source, this div marks the beginning of the input
+ loc = html.find('<div class="mw-spcontent">')
+ if loc > -1:
+ html = html[loc:]
+ #when in the source, marks the end of the linklist
+ loc = html.find('<div class="printfooter">')
+ if loc > -1:
+ html = html[:loc]
+ #our regex fetches internal page links and the link they contain
+ links = R.findall(html)
+ if not links:
+ #no more page to be fetched for that link
+ break
+ for title in links:
+ if not siteurl in title:
+ # the links themselves have similar form
+ if title in cache:
+ continue
+ else:
+ cache.append(title)
+ yield Page(self, title)
+ offset += limit
+
def __repr__(self):
return self.family.name+":"+self.lang
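
For context, a self-contained sketch of the list=exturlusage query the new API branch issues through query.GetData. The requests dependency, the function name, and the endpoint URL are illustrative assumptions rather than pywikipedia code, and the 'query-continue'/euoffset continuation matches the 2009-era API shown in the patch (modern MediaWiki returns a 'continue' block instead).

    import requests

    def linksearch_api(api_url, siteurl, limit=500):
        """Yield titles of pages linking to siteurl, via list=exturlusage."""
        seen = set()
        params = {
            'action': 'query',
            'list': 'exturlusage',
            'euquery': siteurl,
            'eulimit': limit,
            'format': 'json',
        }
        while True:
            data = requests.get(api_url, params=params).json()
            for entry in data['query']['exturlusage']:
                title = entry['title']
                # Skip titles that merely repeat the searched URL and
                # deduplicate, mirroring the cache list in the patch.
                if siteurl not in title and title not in seen:
                    seen.add(title)
                    yield title
            if 'query-continue' in data:
                params['euoffset'] = data['query-continue']['exturlusage']['euoffset']
            else:
                break

    # Example usage (endpoint URL is an assumption):
    # for title in linksearch_api('https://en.wikipedia.org/w/api.php', 'example.org'):
    #     print(title)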