~domy/corpusfiltergraph/old-main

« back to all changes in this revision

Viewing changes to lib/corpusfg/plugins/remove-irrelevant-right.py

  • Committer: tahoar at precisiontranslationtools
  • Date: 2013-08-19 03:46:05 UTC
  • Revision ID: tahoar@precisiontranslationtools.com-20130819034605-o6o6lf0l7myw33ip
updated demo-1 scripts to separate champollion demo. forced '%s\x0a' newline characters, normalized null-copy-file.py name.

Show diffs side-by-side

added added

removed removed

Lines of Context:
6
6
#===============================================================================
7
7
 
8
8
#version:
9
 
#4.5.337 - bugfix for UTF-8 in values that become folder names
 
9
#4.5.343 - added CJK punctuation
10
10
 
11
11
import os
12
12
import sys
17
17
 
18
18
logger = logging.getLogger('.'.join([os.path.splitext(os.path.basename(sys.argv[0]))[0],'manager','filtergraph',__name__]))
19
19
skipclose = True
20
 
extended = u'€‚ƒ„…†‡ˆ‰Š‹Œ‘’“”•–—˜™›¡¢£¤¥¦§¨©ª«¬­®¯°±²³´µ¶·¸¹º»¼½¾¿÷˗⁻₋−'
 
20
extended = u'€‚ƒ„…†‡ˆ‰Š‹Œ‘’“”•–—˜™›¡¢£¤¥¦§¨©ª«¬­®¯°±²³´µ¶·¸¹º»¼½¾¿÷˗⁻₋−:。、'
21
21
whitespace = u'         \x0b\x0c         ​'
22
22
 
23
23
class filter(object):
31
31
                'encoding': 'utf8',
32
32
                'inputfile': '',
33
33
                'outputfile': '',
34
 
                'version': '4.5.337',
 
34
                'version': '4.5.343',
35
35
                }
36
36
 
37
37