if __name__ == '__main__':
    # Command-line entry point (Python 2).
    #
    # Decodes the positional arguments with --charset (default utf-8), then
    # prints either the undecorated text or, with -r/--regexp, the regular
    # expression produced by decorated_match(), encoded back to --charset.
    #
    # Example from the original author's notes: "OEuf" spelled with the
    # U+0152 ligature prints "Oeuf"; with --regexp it prints a pattern that
    # accepts the ligature in either case or an accented o+e pair, followed
    # by the accented variants of "u" and then "[fF]".
    #
    # Exit status: 1 when no string is given; 2 (via parser.error) for an
    # unknown charset or for text that cannot be decoded/encoded with it.
    import codecs
    import sys
    from optparse import OptionParser

    parser = OptionParser(usage='%prog [options] string')
    parser.add_option('--charset', help="set charset. default=%default", action='store', dest='charset', default='utf-8')
    parser.add_option('-r', '--regexp', help="generate regular expression.", action='store_true', dest='regexp')
    (options, args) = parser.parse_args()

    # Reject an unknown codec name up front so the user gets a usage error
    # instead of a LookupError traceback from the first decode/encode call.
    try:
        codecs.lookup(options.charset)
    except LookupError:
        parser.error('unknown charset: %s' % options.charset)

    if not args:
        # Encode explicitly: handing a unicode object to a redirected stderr
        # makes Python 2 fall back to ASCII and raise UnicodeEncodeError.
        # 'replace' keeps the hint printable even if the charset lacks U+0152.
        message = u'Missing required parameter. Try "\u0152uf"'
        sys.stderr.write(message.encode(options.charset, 'replace') + '\n')
        sys.exit(1)

    # Command-line arguments are byte strings in Python 2; decode them once
    # at the boundary. (Named `text` to avoid shadowing the builtin `input`.)
    try:
        text = unicode(' '.join(args), options.charset)
    except UnicodeDecodeError as exc:
        parser.error('cannot decode input as %s: %s' % (options.charset, exc))

    if options.regexp:
        result = decorated_match(text)
    else:
        result = remove_decoration(text)

    # The result may contain characters the chosen charset cannot represent
    # (the generated pattern lists many accented letters); report that as an
    # error rather than silently corrupting the output.
    try:
        encoded = result.encode(options.charset)
    except UnicodeEncodeError as exc:
        parser.error('cannot encode output as %s: %s' % (options.charset, exc))

    sys.stdout.write(encoded + '\n')