Revision: 7991
Author: xqt
Date: 2010-03-12 09:03:31 +0000 (Fri, 12 Mar 2010)
Log Message:
-----------
site.getmagicwords() from site.siteinfo() instead of from the family file
Modified Paths:
--------------
trunk/pywikipedia/family.py
trunk/pywikipedia/wikipedia.py
Modified: trunk/pywikipedia/family.py
===================================================================
--- trunk/pywikipedia/family.py 2010-03-12 08:58:10 UTC (rev 7990)
+++ trunk/pywikipedia/family.py 2010-03-12 09:03:31 UTC (rev 7991)
@@ -1,9 +1,17 @@
# -*- coding: utf-8 -*-
-import config, urllib, re
-from datetime import timedelta, datetime
+#
+# (C) Pywikipedia bot team, 2004-2010
+#
+# Distributed under the terms of the MIT license.
+#
__version__='$Id$'
+import config
+import re
+import urllib
+from datetime import timedelta, datetime
+
# Parent class for all wiki families
class Family:
@@ -2678,8 +2686,8 @@
},
}
- # letters that can follow a wikilink and are regarded as part
- # of this link
+ # letters that can follow a wikilink and are regarded as part of
+ # this link
# This depends on the linktrail setting in LanguageXx.php and on
# [[MediaWiki:Linktrail]].
# Note: this is a regular expression.
@@ -3113,7 +3121,9 @@
# A list with the name for cross-project cookies.
# default for wikimedia centralAuth extensions.
- self.cross_projects_cookies = ['centralauth_Session', 'centralauth_Token', 'centralauth_User']
+ self.cross_projects_cookies = ['centralauth_Session',
+ 'centralauth_Token',
+ 'centralauth_User']
self.cross_projects_cookie_username = 'centralauth_User'
# A list with the name in the cross-language flag permissions
@@ -3449,51 +3459,6 @@
def category_namespaces(self, code):
return self.namespace(code, 14, all = True)
- # So can be pagename code
- pagename = {
- 'bg': [u'СТРАНИЦА'],
- 'he': [u'שם הדף'],
- 'kk': [u'БЕТАТАУЫ'],
- 'nn': ['SIDENAMN', 'SIDENAVN'],
- 'ru': [u'НАЗВАНИЕСТРАНИЦЫ'],
- 'sr': [u'СТРАНИЦА'],
- 'tt': [u'BİTİSEME']
- }
-
- pagenamee = {
- 'he': [u'שם הדף מקודד'],
- 'kk': [u'БЕТАТАУЫ2'],
- 'nn': ['SIDENAMNE', 'SIDENAVNE'],
- 'ru': [u'НАЗВАНИЕСТРАНИЦЫ2'],
- 'sr': [u'СТРАНИЦЕ']
- }
-
- def pagenamecodes(self, code):
- pos = ['PAGENAME']
- pos2 = []
- if code in self.pagename:
- pos = pos + self.pagename[code]
- elif code == 'als':
- return self.pagenamecodes('de')
- elif code == 'bm':
- return self.pagenamecodes('fr')
- for p in pos:
- pos2 += [p, p.lower()]
- return pos2
-
- def pagename2codes(self, code):
- pos = ['PAGENAME']
- pos2 = []
- if code in self.pagenamee:
- pos = pos + self.pagenamee[code]
- elif code == 'als':
- return self.pagename2codes('de')
- elif code == 'bm':
- return self.pagename2codes('fr')
- for p in pos:
- pos2 += [p, p.lower()]
- return pos2
-
# Methods
def protocol(self, code):
"""
Modified: trunk/pywikipedia/wikipedia.py
===================================================================
--- trunk/pywikipedia/wikipedia.py 2010-03-12 08:58:10 UTC (rev 7990)
+++ trunk/pywikipedia/wikipedia.py 2010-03-12 09:03:31 UTC (rev 7991)
@@ -2156,7 +2156,7 @@
text = self.get()
# Replace {{PAGENAME}} by its value
- for pagenametext in self.site().family.pagenamecodes(
+ for pagenametext in self.site().pagenamecodes(
self.site().language()):
text = text.replace(u"{{%s}}" % pagenametext, self.title())
@@ -2363,8 +2363,8 @@
# {{#if: }}
if name.startswith('#'):
continue
- # {{DEFAULTSORT:...}} or {{#if: }}
- defaultKeys = self.site().siteinfo('magicwords')['defaultsort']
+ # {{DEFAULTSORT:...}}
+ defaultKeys = self.site().getmagicwords('defaultsort')
found = False
for key in defaultKeys:
if name.startswith(key):
@@ -6757,19 +6757,18 @@
return True
return False
- def redirect(self, default = False):
+ def getmagicwords(self, word):
+ """Return list of localized "word" magic words for the site."""
+ return self.siteinfo('magicwords').get(word)
+
+ def redirect(self, default=False):
"""Return the localized redirect tag for the site.
- If default is True, falls back to 'REDIRECT' if the site has no
- special redirect tag.
+ Argument is ignored (but maintained for backwards-compatibility).
"""
- tag = self.siteinfo('magicwords').get('redirect')
- if tag:
- # remove first "#" letter
- return tag[0][1:]
- elif default:
- return u'REDIRECT'
+ # return the magic word without the preceding '#' character
+ return self.getmagicwords('redirect')[0].lstrip("#")
def redirectRegex(self):
"""Return a compiled regular expression matching on redirect pages.
@@ -6780,7 +6779,7 @@
#NOTE: this is needed, since the API can give false positives!
default = 'REDIRECT'
try:
- keywords = self.siteinfo('magicwords')['redirect']
+ keywords = self.getmagicwords('redirect')
pattern = r'(?:' + '|'.join(keywords) + ')'
except KeyError:
# no localized keyword for redirects
@@ -6797,6 +6796,14 @@
+ '\s*:?\s*\[\[(.+?)(?:\|.*?)?\]\]',
re.IGNORECASE | re.UNICODE | re.DOTALL)
+ def pagenamecodes(self, default=True):
+ """Return list of localized PAGENAME tags for the site."""
+ return self.getmagicwords('pagename')
+
+ def pagename2codes(self, default=True):
+ """Return list of localized PAGENAMEE tags for the site."""
+ return self.getmagicwords('pagenamee')
+
def resolvemagicwords(self, wikitext):
"""Replace the {{ns:xx}} marks in a wikitext with the namespace names"""
Revision: 7988
Author: xqt
Date: 2010-03-11 17:44:03 +0000 (Thu, 11 Mar 2010)
Log Message:
-----------
test api with new has_api() method; move throttle.log to control file
Modified Paths:
--------------
trunk/pywikipedia/wikipedia.py
Property Changed:
----------------
trunk/pywikipedia/pywikibot/
Property changes on: trunk/pywikipedia/pywikibot
___________________________________________________________________
Modified: svn:ignore
- *.pyc
+ *.pyc
*.ctrl
Modified: trunk/pywikipedia/wikipedia.py
===================================================================
--- trunk/pywikipedia/wikipedia.py 2010-03-11 15:01:00 UTC (rev 7987)
+++ trunk/pywikipedia/wikipedia.py 2010-03-11 17:44:03 UTC (rev 7988)
@@ -4144,12 +4144,13 @@
self.releasepid = 1200 # Free the process id
self.lastwait = 0.0
self.delay = 0
- if multiplydelay:
+ self.multiplydelay = multiplydelay
+ if self.multiplydelay:
self.checkMultiplicity()
self.setDelay(mindelay)
def logfn(self):
- return config.datafilepath('logs', 'throttle.log')
+ return config.datafilepath('pywikibot', 'throttle.ctrl')
def checkMultiplicity(self):
self.lock.acquire()
@@ -4211,7 +4212,7 @@
def getDelay(self):
thisdelay = self.delay
- if self.pid: # If self.pid, we're checking for multiple processes
+ if self.multiplydelay: # If self.pid, we're checking for multiple processes
if time.time() > self.checktime + self.checkdelay:
self.checkMultiplicity()
if thisdelay < (self.mindelay * self.next_multiplicity):
@@ -4595,6 +4596,7 @@
mediawiki_message: Retrieve the text of a specified MediaWiki message
has_mediawiki_message: True if this site defines specified MediaWiki
message
+ has_api: True if this site's family provides api interface
shared_image_repository: Return tuple of image repositories used by this
site.
@@ -5677,21 +5679,13 @@
"""Return the MediaWiki message text for key "key" """
# Allmessages is retrieved once for all per created Site object
if (not self._mediawiki_messages) or forceReload:
- api = False
+ api = self.has_api()
if verbose:
output(u"Retrieving mediawiki messages from Special:Allmessages")
# Only MediaWiki r27393/1.12 and higher support XML output for Special:Allmessages
if self.versionnumber() < 12:
usePHP = True
else:
- try:
- if config.use_api:
- x = self.api_address()
- del x
- api = True
- except NotImplementedError:
- api = False
-
usePHP = False
elementtree = True
try:
@@ -5797,6 +5791,17 @@
return True
except KeyError:
return False
+
+ def has_api(self):
+ """Return True if this sites family has api interface."""
+ try:
+ if config.use_api:
+ x = self.apipath()
+ del x
+ return True
+ except NotImplementedError:
+ pass
+ return False
def _load(self, sysop = False, force = False):
"""
@@ -5814,16 +5819,10 @@
if verbose:
output(u'Getting information for site %s' % self)
- try:
- api_url = self.api_address()
- del api_url
- except NotImplementedError:
- config.use_api = False
-
# Get data
# API Userinfo is available from version 1.11
# preferencetoken available from 1.14
- if config.use_api and self.versionnumber() >= 11:
+ if self.has_api() and self.versionnumber() >= 11:
#Query userinfo
params = {
'action': 'query',
@@ -5860,66 +5859,47 @@
Use API when enabled use_api and version >= 1.11,
or use Special:Search.
"""
- try:
- if config.use_api and self.versionnumber() >= 11:
- apiUrl = self.site().api_address()
- del apiUrl
- else:
- raise NotImplementedError
- except NotImplementedError:
- _search = self._search_without_api
+ if self.has_api() and self.versionnumber() >= 11:
+ #Yield search results (using api) for query.
+ params = {
+ 'action': 'query',
+ 'list': 'search',
+ 'srsearch': q,
+ 'srlimit': number
+ }
+ if namespaces:
+ params['srnamespace'] = namespaces
+
+ offset = 0
+ while True:
+ params['sroffset'] = offset
+ data = query.GetData(params, self)['query']
+ if 'error' in data:
+ raise RuntimeError('%s' % data['error'])
+ if not data['search']:
+ break
+ for s in data['search']:
+ offset += 1
+ page = Page(self, s['title'])
+ yield page, s['snippet'], '', s['size'], s['wordcount'], s['timestamp']
else:
- _search = self._search_with_api
- return _search(query, number, namespaces)
+ #Yield search results (using Special:Search page) for query.
+ throttle = True
+ path = self.search_address(urllib.quote_plus(query.encode('utf-8')),
+ n=number, ns=namespaces)
+ get_throttle()
+ html = self.getUrl(path)
+ entryR = re.compile(ur'<li><a href=".+?" title="(?P<title>.+?)">.+?</a>',
+ re.DOTALL)
+ for m in entryR.finditer(html):
+ page = Page(self, m.group('title'))
+ yield page, '', '', '', '', ''
- def _search_with_api(self, q, number, namespaces):
- """Yield search results (using api) for query."""
- params = {
- 'action': 'query',
- 'list': 'search',
- 'srsearch': q,
- 'srlimit': number
- }
- if namespaces:
- params['srnamespace'] = namespaces
-
- offset = 0
- while True:
- params['sroffset'] = offset
- data = query.GetData(params, self)['query']
- if 'error' in data:
- raise RuntimeError('%s' % data['error'])
- if not data['search']:
- break
- for s in data['search']:
- offset += 1
- page = Page(self, s['title'])
- yield page, s['snippet'], '', s['size'], s['wordcount'], s['timestamp']
-
- def _search_without_api(self, query, number, namespaces):
- """Yield search results (using Special:Search page) for query."""
- throttle = True
- path = self.search_address(urllib.quote_plus(query.encode('utf-8')),
- n=number, ns=namespaces)
- get_throttle()
- html = self.getUrl(path)
-
- entryR = re.compile(ur'<li><a href=".+?" title="(?P<title>.+?)">.+?</a>',
- re.DOTALL)
-
- for m in entryR.finditer(html):
- page = Page(self, m.group('title'))
- yield page, '', '', '', '', ''
-
# TODO: avoid code duplication for the following methods
def logpages(self, number=50, mode='', user=None, repeat=False, namespace=[], offset=-1):
- if config.use_api:
- apiURL = self.api_address()
- del apiURL
- else:
- raise NotImplementedError
- if mode not in ('block', 'protect', 'rights', 'delete', 'upload',
+ if not self.has_api() or \
+ mode not in ('block', 'protect', 'rights', 'delete', 'upload',
'move', 'import', 'patrol', 'merge', 'suppress',
'review', 'stable', 'gblblock', 'renameuser',
'globalauth', 'gblrights', 'abusefilter', 'newusers'):
@@ -5986,14 +5966,9 @@
# should use both offset and limit parameters, and have an
# option to fetch older rather than newer pages
seen = set()
- try:
- d = self.apipath()
- del d
- except NotImplementedError:
- config.use_api = False
-
+ api = self.has_api()
while True:
- if config.use_api and self.versionnumber() >= 10:
+ if api and self.versionnumber() >= 10:
params = {
'action': 'query',
'list': 'recentchanges',
@@ -6668,18 +6643,12 @@
"""Yield Pages from results of Special:Linksearch for 'siteurl'."""
cache = []
R = re.compile('title ?=\"([^<>]*?)\">[^<>]*</a></li>')
- #Check API can work
- if config.use_api:
- try:
- d = self.api_address()
- del d
- except NotImplementedError:
- config.use_api = False
-
+ api = self.has_api()
urlsToRetrieve = [siteurl]
if not siteurl.startswith('*.'):
urlsToRetrieve.append('*.' + siteurl)
- if config.use_api and self.versionnumber() >= 11:
+
+ if api and self.versionnumber() >= 11:
output(u'Querying API exturlusage...')
for url in urlsToRetrieve:
params = {
Revision: 7986
Author: russblau
Date: 2010-03-11 14:54:20 +0000 (Thu, 11 Mar 2010)
Log Message:
-----------
Merge recent changes from trunk.
Modified Paths:
--------------
branches/rewrite/scripts/solve_disambiguation.py
Modified: branches/rewrite/scripts/solve_disambiguation.py
===================================================================
--- branches/rewrite/scripts/solve_disambiguation.py 2010-03-10 15:45:02 UTC (rev 7985)
+++ branches/rewrite/scripts/solve_disambiguation.py 2010-03-11 14:54:20 UTC (rev 7986)
@@ -27,6 +27,9 @@
-just only use the alternatives given on the command line, do not
read the page for other possibilities
+ -dnskip Skip links already marked with a disambiguation-needed
+ template (e.g., {{dn}})
+
-primary "primary topic" disambiguation (Begriffsklärung nach Modell 2).
That's titles where one topic is much more important, the
disambiguation page is saved somewhere else, and the important
@@ -55,7 +58,7 @@
wiki that is defined (to the bot) as the category containing
disambiguation pages, starting at XY. If only '-start' or
'-start:' is given, it starts at the beginning.
-
+
-min:XX (XX being a number) only work on disambiguation pages for which
at least XX are to be worked on.
@@ -191,6 +194,21 @@
'uk': u'Виправлення посилання на багатозначність за допомогою бота: %s вилучено',
}
+# Disambiguation Needed template
+dn_template = {
+ 'en' : u'{{dn}}',
+ }
+
+# Summary message when adding Disambiguation Needed template
+msg_dn = {
+ 'en' : u'Robot-assisted disambiguation: %s - Marked as needing expert attention',
+ }
+
+# Summary message when adding Disambiguation Needed template to a redirect link
+msg_redir_dn = {
+ 'en' : u'Robot-assisted disambiguation: %s - Marked as needing expert attention',
+ }
+
# Summary message to (unknown)
unknown_msg = {
'ar' : u'(غير معروف)',
@@ -417,7 +435,7 @@
self.primaryIgnoreManager = PrimaryIgnoreManager(disambPage,
enabled=primary)
self.minimum = minimum
-
+
def __iter__(self):
# TODO: start yielding before all referring pages have been found
refs = [page for page in
@@ -510,17 +528,18 @@
u'{{[Pp]rocessing}}',
),
}
-
+
primary_redir_template = {
# Page.templates() format, first letter uppercase
'hu': u'Egyért-redir',
}
-
- def __init__(self, always, alternatives, getAlternatives, generator,
+
+ def __init__(self, always, alternatives, getAlternatives, dnSkip, generator,
primary, main_only, minimum = 0):
self.always = always
self.alternatives = alternatives
self.getAlternatives = getAlternatives
+ self.dnSkip = dnSkip
self.generator = generator
self.primary = primary
self.main_only = main_only
@@ -579,9 +598,12 @@
# group linktrail is the link trail, that's letters after ]] which
# are part of the word.
# note that the definition of 'letter' varies from language to language.
- self.linkR = re.compile(
- r'\[\[(?P<title>[^\]\|#]*)(?P<section>#[^\]\|]*)?(\|(?P<label>[^\]]*))?\]\](?P<linktrail>'
- + linktrail + ')')
+ self.linkR = re.compile(r'''
+ \[\[ (?P<title> [^\[\]\|#]*)
+ (?P<section> \#[^\]\|]*)?
+ (\|(?P<label> [^\]]*))? \]\]
+ (?P<linktrail>%s)''' % linktrail,
+ flags=re.X)
def treat(self, refPage, disambPage):
"""
@@ -591,10 +613,11 @@
refPage - A page linking to disambPage
Returns False if the user pressed q to completely quit the program.
Otherwise, returns True.
-
+
"""
# TODO: break this function up into subroutines!
+ dn_template_str = pywikibot.translate(self.mysite, dn_template)
include = False
unlink = False
new_targets = []
@@ -647,6 +670,7 @@
original_text = text
n = 0
curpos = 0
+ dn = False
edited = False
# This loop will run until we have finished the current page
while True:
@@ -670,11 +694,23 @@
if foundlink.site != disambPage.site():
continue
# check whether the link found is to disambPage
- if foundlink.canonical_title() != disambPage.title():
+ try:
+ if foundlink.canonical_title() != disambPage.title():
+ continue
+ except pywikibot.Error:
+ # must be a broken link
+ pywikibot.output("Invalid link [[%s]] in page [[%s]]"
+ % (m.group('title'), refPage.title()),
+ level=pywikibot.VERBOSE)
continue
n += 1
# how many bytes should be displayed around the current link
context = 60
+ #there's a {{dn}} here already
+ already_dn = text[m.end() : m.end() + 8].find(dn_template_str[:4]) > -1
+ if already_dn and self.dnSkip:
+ continue
+
# This loop will run while the user doesn't choose an option
# that will actually change the page
while True:
@@ -697,10 +733,12 @@
if edited:
choice = pywikibot.input(
u"Option (#, r#, s=skip link, e=edit page, n=next page, u=unlink, q=quit,\n"
+u" ?=tag with " + dn_template_str + ",\n"
u" m=more context, l=list, a=add new, x=save in this form):")
else:
choice = pywikibot.input(
u"Option (#, r#, s=skip link, e=edit page, n=next page, u=unlink, q=quit,\n"
+u" ?=tag with " + dn_template_str + ",\n"
u" m=more context, d=show disambiguation page, l=list, a=add new):")
else:
choice = self.always
@@ -775,7 +813,21 @@
if trailing_chars:
link_text += trailing_chars
- if choice in ['u', 'U']:
+ if choice in ['?', '/']:
+ #small chunk of text to search
+ search_text = text[m.end() : m.end() + context]
+ #figure out where the link (and sentance) ends, put note there
+ end_of_word_match = re.search("\s", search_text)
+ if end_of_word_match:
+ position_split = end_of_word_match.start(0)
+ else:
+ position_split = 0
+ #insert dab needed template
+ text = text[:m.end() + position_split] + dn_template_str \
+ + text[m.end() + position_split:]
+ dn = True
+ continue
+ elif choice in ['u', 'U']:
# unlink - we remove the section if there's any
text = text[:m.start()] + link_text + text[m.end():]
unlink = True
@@ -852,7 +904,7 @@
pywikibot.showDiff(original_text, text)
pywikibot.output(u'')
# save the page
- self.setSummaryMessage(disambPage, new_targets, unlink)
+ self.setSummaryMessage(disambPage, new_targets, unlink, dn)
try:
refPage.put_async(text,comment=self.comment)
except pywikibot.LockedPage:
@@ -936,7 +988,8 @@
self.alternatives += links
return True
- def setSummaryMessage(self, disambPage, new_targets=[], unlink=False):
+ def setSummaryMessage(self, disambPage, new_targets=[], unlink=False,
+ dn=False):
# make list of new targets
targets = ''
for page_title in new_targets:
@@ -968,23 +1021,25 @@
elif disambPage.isRedirectPage():
# when working on redirects, there's another summary message
if unlink and not new_targets:
- self.comment = pywikibot.translate(
- self.mysite,
- msg_redir_unlink
- ) % disambPage.title()
+ self.comment = pywikibot.translate(self.mysite,
+ msg_redir_unlink) \
+ % disambPage.title()
+ elif dn and not new_targets:
+ self.comment = pywikibot.translate(self.mysite, msg_redir_dn) \
+ % disambPage.title()
else:
- self.comment = pywikibot.translate(
- self.mysite, msg_redir
- ) % (disambPage.title(), targets)
+ self.comment = pywikibot.translate(self.mysite, msg_redir) \
+ % (disambPage.title(), targets)
else:
if unlink and not new_targets:
- self.comment = pywikibot.translate(
- self.mysite, msg_unlink
- ) % disambPage.title()
+ self.comment = pywikibot.translate(self.mysite, msg_unlink) \
+ % disambPage.title()
+ elif dn and not new_targets:
+ self.comment = pywikibot.translate(self.mysite, msg_dn) \
+ % disambPage.title()
else:
- self.comment = pywikibot.translate(
- self.mysite, msg
- ) % (disambPage.title(), targets)
+ self.comment = pywikibot.translate(self.mysite, msg) \
+ % (disambPage.title(), targets)
def run(self):
if self.main_only:
@@ -1029,6 +1084,7 @@
always = None
alternatives = []
getAlternatives = True
+ dnSkip = False
# if the -file argument is used, page titles are dumped in this array.
# otherwise it will only contain one page.
generator = None
@@ -1074,6 +1130,8 @@
alternatives.append(arg[5:])
elif arg == '-just':
getAlternatives = False
+ elif arg == '-dnskip':
+ dnSkip = True
elif arg == '-main':
main_only = True
elif arg.startswith('-min:'):
@@ -1106,7 +1164,7 @@
page = pywikibot.Page(pywikibot.Link(pageTitle, pywikibot.getSite()))
generator = iter([page])
- # if no disambiguation pages was given as an argument, and none was
+ # if no disambiguation page was given as an argument, and none was
# read from a file, query the user
if not generator:
pageTitle = pywikibot.input(
@@ -1114,12 +1172,12 @@
page = pywikibot.Page(pywikibot.Link(pageTitle, pywikibot.getSite()))
generator = iter([page])
- bot = DisambiguationRobot(always, alternatives, getAlternatives, generator,
- primary, main_only, minimum=minimum)
+ bot = DisambiguationRobot(always, alternatives, getAlternatives, dnSkip,
+ generator, primary, main_only,
+ minimum=minimum)
bot.run()
-
if __name__ == "__main__":
try:
main()
Revision: 7984
Author: russblau
Date: 2010-03-09 19:07:34 +0000 (Tue, 09 Mar 2010)
Log Message:
-----------
Implement Assert Edit extension (note: using assert=user, *not* assert=bot, because it may be possible to use the framework without a bot flag on some wikis); also convert various debug statements to pywikibot.output calls.
Modified Paths:
--------------
branches/rewrite/pywikibot/data/api.py
Modified: branches/rewrite/pywikibot/data/api.py
===================================================================
--- branches/rewrite/pywikibot/data/api.py 2010-03-09 08:14:34 UTC (rev 7983)
+++ branches/rewrite/pywikibot/data/api.py 2010-03-09 19:07:34 UTC (rev 7984)
@@ -79,7 +79,7 @@
Returns a dict containing the JSON data returned by the wiki. Normally,
one of the dict keys will be equal to the value of the 'action'
parameter. Errors are caught and raise an APIError exception.
-
+
Example:
>>> r = Request(site=mysite, action="query", meta="userinfo")
@@ -99,7 +99,7 @@
[u'query']
>>> data[u'query'].keys()
[u'userinfo', u'namespaces']
-
+
@param site: The Site to which the request will be submitted. If not
supplied, uses the user's configured default Site.
@param mime: If true, send in "multipart/form-data" format (default False)
@@ -123,6 +123,15 @@
if "action" not in kwargs:
raise ValueError("'action' specification missing from Request.")
self.update(**kwargs)
+ self.write = self.params["action"] in (
+ "edit", "move", "rollback", "delete", "undelete",
+ "protect", "block", "unblock", "watch", "patrol",
+ "import", "userrights", "upload"
+ )
+ if self.write:
+ pywikibot.output(u"Adding user assertion",
+ level=pywikibot.DEBUG)
+ self.params["assert"] = "user" # make sure user is logged in
# implement dict interface
def __getitem__(self, key):
@@ -151,7 +160,13 @@
for key in self.params:
if isinstance(self.params[key], basestring):
+ # convert a stringified sequence into a list
self.params[key] = self.params[key].split("|")
+ try:
+ iter(self.params[key])
+ except TypeError:
+ # convert any non-iterable value into a single-element list
+ self.params[key] = [str(self.params[key])]
if self.params["action"] == ['query']:
meta = self.params.get("meta", [])
if "userinfo" not in meta:
@@ -187,27 +202,23 @@
+ "/api.php?"
+ self.http_params()
)
-
+
def submit(self):
"""Submit a query and parse the response.
@return: The data retrieved from api.php (a dict)
-
+
"""
from pywikibot.comms import http
from email.mime.multipart import MIMEMultipart
from email.mime.nonmultipart import MIMENonMultipart
- params = self.http_params()
+ paramstring = self.http_params()
if self.site._loginstatus == -3:
self.site.login(False)
while True:
action = self.params.get("action", "")
- write = action in (
- "edit", "move", "rollback", "delete", "undelete",
- "protect", "block", "unblock"
- )
- self.site.throttle(write=write)
+ self.site.throttle(write=self.write)
uri = self.site.scriptpath() + "/api.php"
try:
ssl = False
@@ -256,22 +267,24 @@
rawdata = http.request(self.site, uri, ssl, method="POST",
headers={'Content-Type':
'application/x-www-form-urlencoded'},
- body=params)
+ body=paramstring)
except Server504Error:
- logger.debug(u"Caught 504 error")
+ pywikibot.output(u"Caught 504 error",
+ level=pywikibot.DEBUG)
raise
#TODO: what other exceptions can occur here?
except Exception, e:
# for any other error on the http request, wait and retry
pywikibot.output(traceback.format_exc(),
level=pywikibot.ERROR)
- pywikibot.output(u"%s, %s" % (uri, params),
+ pywikibot.output(u"%s, %s" % (uri, paramstring),
level=pywikibot.VERBOSE)
self.wait()
continue
if not isinstance(rawdata, unicode):
rawdata = rawdata.decode(self.site.encoding())
- logger.debug(u"API response received:\n" + rawdata)
+ pywikibot.output(u"API response received:\n" + rawdata,
+ level=pywikibot.DEBUG)
if rawdata.startswith(u"unknown_action"):
raise APIError(rawdata[:14], rawdata[16:])
try:
@@ -281,8 +294,10 @@
# problem. Wait a few seconds and try again
pywikibot.output(
"Non-JSON response received from server %s; the server may be down."
- % self.site, level=pywikibot.WARNING)
- logger.debug(rawdata)
+ % self.site,
+ level=pywikibot.WARNING)
+ pywikibot.output(rawdata,
+ level=pywikibot.DEBUG)
self.wait()
continue
if not result:
@@ -389,6 +404,7 @@
self.site = kwargs["site"]
except KeyError:
self.site = pywikibot.Site()
+ kwargs["site"] = self.site
# make sure request type is valid, and get limit key if any
for modtype in ("generator", "list", "prop", "meta"):
if modtype in kwargs:
@@ -417,7 +433,7 @@
def get_module(self):
"""Query api on self.site for paraminfo on querymodule=self.module"""
-
+
paramreq = Request(site=self.site, action="paraminfo",
querymodules=self.module)
data = paramreq.submit()
@@ -456,7 +472,7 @@
"""
self.limit = int(value)
-
+
def update_limit(self):
"""Set query_limit for self.module based on api response"""
@@ -472,9 +488,10 @@
self.query_limit = int(param["max"])
if self.prefix is None:
self.prefix = _modules[mod]["prefix"]
- logger.debug(u"%s: Set query_limit to %i."
- % (self.__class__.__name__,
- self.query_limit))
+ pywikibot.output(u"%s: Set query_limit to %i."
+ % (self.__class__.__name__,
+ self.query_limit),
+ level=pywikibot.DEBUG)
return
def set_namespace(self, namespaces):
@@ -522,27 +539,34 @@
self.set_query_increment(old_limit // 2)
continue
if not self.data or not isinstance(self.data, dict):
- logger.debug(
+ pywikibot.output(
u"%s: stopped iteration because no dict retrieved from api."
- % self.__class__.__name__)
+ % self.__class__.__name__,
+ level=pywikibot.DEBUG)
return
if not ("query" in self.data
and self.resultkey in self.data["query"]):
- logger.debug(
+ pywikibot.output(
u"%s: stopped iteration because 'query' and '%s' not found in api response."
- % (self.__class__.__name__, self.resultkey))
- logger.debug(unicode(self.data))
+ % (self.__class__.__name__, self.resultkey),
+ level=pywikibot.DEBUG)
+ pywikibot.output(unicode(self.data),
+ level=pywikibot.DEBUG)
return
resultdata = self.data["query"][self.resultkey]
if isinstance(resultdata, dict):
- logger.debug(u"%s received %s; limit=%s"
- % (self.__class__.__name__, resultdata.keys(),
- self.limit))
+ pywikibot.output(u"%s received %s; limit=%s"
+ % (self.__class__.__name__,
+ resultdata.keys(),
+ self.limit),
+ level=pywikibot.DEBUG)
resultdata = [resultdata[k] for k in sorted(resultdata.keys())]
else:
- logger.debug(u"%s received %s; limit=%s"
- % (self.__class__.__name__, resultdata,
- self.limit))
+ pywikibot.output(u"%s received %s; limit=%s"
+ % (self.__class__.__name__,
+ resultdata,
+ self.limit),
+ level=pywikibot.DEBUG)
if "normalized" in self.data["query"]:
self.normalized = dict((item['to'], item['from'])
for item in
@@ -581,13 +605,13 @@
This class can be used for any of the query types that are listed in the
API documentation as being able to be used as a generator. Instances of
this class iterate Page objects.
-
+
"""
def __init__(self, generator, **kwargs):
"""
Required and optional parameters are as for C{Request}, except that
action=query is assumed and generator is required.
-
+
@param generator: the "generator=" type from api.php
@type generator: str
@@ -614,7 +638,7 @@
This can be overridden in subclasses to return a different type
of object.
-
+
"""
p = pywikibot.Page(self.site, pagedata['title'], pagedata['ns'])
update_page(p, pagedata)
@@ -657,7 +681,7 @@
"""
Required and optional parameters are as for C{Request}, except that
action=query is assumed and prop is required.
-
+
@param prop: the "property=" type from api.php
@type prop: str
@@ -684,7 +708,7 @@
"""
Required and optional parameters are as for C{Request}, except that
action=query is assumed and listaction is required.
-
+
@param listaction: the "list=" type from api.php
@type listaction: str
@@ -700,7 +724,7 @@
def __init__(self, logtype, **kwargs):
ListGenerator.__init__(self, "logevents", **kwargs)
- import logentries
+ import logentries
self.entryFactory = logentries.LogEntryFactory(logtype)
def result(self, pagedata):
@@ -715,7 +739,7 @@
Parameters are all ignored.
Returns cookie data if succesful, None otherwise.
-
+
"""
if hasattr(self, '_waituntil'):
if datetime.now() < self._waituntil: