User:WindBOT/CoreSource: Difference between revisions

Jump to navigation Jump to search
mNo edit summary
(rm py2.7 hax, +extra possibilities for word boundaries in cyrillic, +better arrow symbols)
Line 30: Line 30:
import wikiUpload
import wikiUpload
import feedparser
import feedparser
# Hax for Python < 2.7
try:
from collections import OrderedDict
except:
from backport_OrderedDict import OrderedDict
import collections
collections.OrderedDict = OrderedDict
try:
try:
import steam
import steam
Line 159: Line 152:
summary = getSummary(summary)
summary = getSummary(summary)
p = page(p)
p = page(p)
print 'Editing', p.title, 'with summary', summary
try:
print 'Editing', p.title, 'with summary', summary
except:
pass
try:
try:
if nocreate:
if nocreate:
Line 777: Line 773:
return setFilterName(curry(dumbReplacement, rs), u'DumbReplacements(' + u(rs) + u')')
return setFilterName(curry(dumbReplacement, rs), u'DumbReplacements(' + u(rs) + u')')
def dumbReplace(subject, replacement):
def dumbReplace(subject, replacement):
return setFilterName(dumbReplaces({subject: replacement}), u'DumbReplacement(' + u(subject) + u' -> ' + u(replacement) + u')')
return setFilterName(dumbReplaces({subject: replacement}), u'DumbReplacement(' + u(subject) + u' \u2192 ' + u(replacement) + u')')
def wordRegex(word, **kwargs):
def wordRegex(word, **kwargs):
flags = None
flags = None
Line 784: Line 780:
word = word[0]
word = word[0]
word = u(re.sub(r'[-_ ]+', r'[-_ ]', u(word)))
word = u(re.sub(r'[-_ ]+', r'[-_ ]', u(word)))
word = u(r"(?<![\u00E8-\u00F8\xe8-\xf8\w])(?<!'')(?<!" + r'"' + r")(?:\b|^)" + word + r"(?:\b(?![\u00E8-\u00F8\xe8-\xf8\w])(?!''|" + r'"' + r")|$)")
word = u(r"(?<![\u00E8-\u00F8\xe8-\xf8\w])(?<!'')(?<!" + r'"' + ")(?:\\b|(?<=[ \\[\\]\\(\\):;.,\"'*\\xab\\xbb])|^)" + word + r"(?:\b(?![\u00E8-\u00F8\xe8-\xf8\w])(?!''|" + r'"' + ")|(?=[ \\[\\]\(\\):;.,\"'*\\xab\\xbb])|$)")
if flags is None:
if flags is None:
return word
return word
Line 809: Line 805:
else:
else:
rs[wordRegex(w, **kwargs)] = correct
rs[wordRegex(w, **kwargs)] = correct
return setFilterName(regexes(rs), u'WordFilter(' + u'/'.join(badwords2) + u' -> ' + correct + u')')
return setFilterName(regexes(rs), u'WordFilter(' + u'/'.join(badwords2) + u' \u2192 ' + correct + u')')
def enforceCapitalization(*words, **kwargs):
def enforceCapitalization(*words, **kwargs):
for w in words:
for w in words: