aboutsummaryrefslogtreecommitdiffstats
path: root/contrib/python/Pygments/py3/pygments/lexers/praat.py
blob: 112d583acbcb27f32e2a73f85ba4c256aea033da (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
""" 
    pygments.lexers.praat 
    ~~~~~~~~~~~~~~~~~~~~~ 
 
    Lexer for Praat 
 
    :copyright: Copyright 2006-2021 by the Pygments team, see AUTHORS.
    :license: BSD, see LICENSE for details. 
""" 
 
from pygments.lexer import RegexLexer, words, bygroups, include 
from pygments.token import Name, Text, Comment, Keyword, String, Punctuation, Number, \ 
    Operator 
 
__all__ = ['PraatLexer'] 
 
 
class PraatLexer(RegexLexer): 
    """ 
    For `Praat <http://www.praat.org>`_ scripts. 
 
    .. versionadded:: 2.1 
    """ 
 
    name = 'Praat' 
    aliases = ['praat'] 
    filenames = ['*.praat', '*.proc', '*.psc'] 
 
    keywords = (
        'if', 'then', 'else', 'elsif', 'elif', 'endif', 'fi', 'for', 'from', 'to', 
        'endfor', 'endproc', 'while', 'endwhile', 'repeat', 'until', 'select', 'plus', 
        'minus', 'demo', 'assert', 'stopwatch', 'nocheck', 'nowarn', 'noprogress', 
        'editor', 'endeditor', 'clearinfo', 
    )
 
    functions_string = (
        'backslashTrigraphsToUnicode', 'chooseDirectory', 'chooseReadFile', 
        'chooseWriteFile', 'date', 'demoKey', 'do', 'environment', 'extractLine', 
        'extractWord', 'fixed', 'info', 'left', 'mid', 'percent', 'readFile', 'replace', 
        'replace_regex', 'right', 'selected', 'string', 'unicodeToBackslashTrigraphs', 
    )
 
    functions_numeric = (
        'abs', 'appendFile', 'appendFileLine', 'appendInfo', 'appendInfoLine', 'arccos', 
        'arccosh', 'arcsin', 'arcsinh', 'arctan', 'arctan2', 'arctanh', 'barkToHertz', 
        'beginPause', 'beginSendPraat', 'besselI', 'besselK', 'beta', 'beta2', 
        'binomialP', 'binomialQ', 'boolean', 'ceiling', 'chiSquareP', 'chiSquareQ', 
        'choice', 'comment', 'cos', 'cosh', 'createDirectory', 'deleteFile', 
        'demoClicked', 'demoClickedIn', 'demoCommandKeyPressed', 
        'demoExtraControlKeyPressed', 'demoInput', 'demoKeyPressed', 
        'demoOptionKeyPressed', 'demoShiftKeyPressed', 'demoShow', 'demoWaitForInput', 
        'demoWindowTitle', 'demoX', 'demoY', 'differenceLimensToPhon', 'do', 'editor', 
        'endPause', 'endSendPraat', 'endsWith', 'erb', 'erbToHertz', 'erf', 'erfc', 
        'exitScript', 'exp', 'extractNumber', 'fileReadable', 'fisherP', 'fisherQ', 
        'floor', 'gaussP', 'gaussQ', 'hertzToBark', 'hertzToErb', 'hertzToMel', 
        'hertzToSemitones', 'imax', 'imin', 'incompleteBeta', 'incompleteGammaP', 'index', 
        'index_regex', 'integer', 'invBinomialP', 'invBinomialQ', 'invChiSquareQ', 'invFisherQ',
        'invGaussQ', 'invSigmoid', 'invStudentQ', 'length', 'ln', 'lnBeta', 'lnGamma', 
        'log10', 'log2', 'max', 'melToHertz', 'min', 'minusObject', 'natural', 'number', 
        'numberOfColumns', 'numberOfRows', 'numberOfSelected', 'objectsAreIdentical', 
        'option', 'optionMenu', 'pauseScript', 'phonToDifferenceLimens', 'plusObject', 
        'positive', 'randomBinomial', 'randomGauss', 'randomInteger', 'randomPoisson', 
        'randomUniform', 'real', 'readFile', 'removeObject', 'rindex', 'rindex_regex', 
        'round', 'runScript', 'runSystem', 'runSystem_nocheck', 'selectObject', 
        'selected', 'semitonesToHertz', 'sentence', 'sentencetext', 'sigmoid', 'sin', 'sinc',
        'sincpi', 'sinh', 'soundPressureToPhon', 'sqrt', 'startsWith', 'studentP', 
        'studentQ', 'tan', 'tanh', 'text', 'variableExists', 'word', 'writeFile', 'writeFileLine',
        'writeInfo', 'writeInfoLine', 
    )
 
    functions_array = (
        'linear', 'randomGauss', 'randomInteger', 'randomUniform', 'zero', 
    )
 
    objects = (
        'Activation', 'AffineTransform', 'AmplitudeTier', 'Art', 'Artword', 
        'Autosegment', 'BarkFilter', 'BarkSpectrogram', 'CCA', 'Categories', 
        'Cepstrogram', 'Cepstrum', 'Cepstrumc', 'ChebyshevSeries', 'ClassificationTable', 
        'Cochleagram', 'Collection', 'ComplexSpectrogram', 'Configuration', 'Confusion', 
        'ContingencyTable', 'Corpus', 'Correlation', 'Covariance', 
        'CrossCorrelationTable', 'CrossCorrelationTables', 'DTW', 'DataModeler', 
        'Diagonalizer', 'Discriminant', 'Dissimilarity', 'Distance', 'Distributions', 
        'DurationTier', 'EEG', 'ERP', 'ERPTier', 'EditCostsTable', 'EditDistanceTable', 
        'Eigen', 'Excitation', 'Excitations', 'ExperimentMFC', 'FFNet', 'FeatureWeights', 
        'FileInMemory', 'FilesInMemory', 'Formant', 'FormantFilter', 'FormantGrid', 
        'FormantModeler', 'FormantPoint', 'FormantTier', 'GaussianMixture', 'HMM', 
        'HMM_Observation', 'HMM_ObservationSequence', 'HMM_State', 'HMM_StateSequence', 
        'Harmonicity', 'ISpline', 'Index', 'Intensity', 'IntensityTier', 'IntervalTier', 
        'KNN', 'KlattGrid', 'KlattTable', 'LFCC', 'LPC', 'Label', 'LegendreSeries', 
        'LinearRegression', 'LogisticRegression', 'LongSound', 'Ltas', 'MFCC', 'MSpline', 
        'ManPages', 'Manipulation', 'Matrix', 'MelFilter', 'MelSpectrogram', 
        'MixingMatrix', 'Movie', 'Network', 'Object', 'OTGrammar', 'OTHistory', 'OTMulti',
        'PCA', 'PairDistribution', 'ParamCurve', 'Pattern', 'Permutation', 'Photo',
        'Pitch', 'PitchModeler', 'PitchTier', 'PointProcess', 'Polygon', 'Polynomial',
        'PowerCepstrogram', 'PowerCepstrum', 'Procrustes', 'RealPoint', 'RealTier', 
        'ResultsMFC', 'Roots', 'SPINET', 'SSCP', 'SVD', 'Salience', 'ScalarProduct', 
        'Similarity', 'SimpleString', 'SortedSetOfString', 'Sound', 'Speaker', 
        'Spectrogram', 'Spectrum', 'SpectrumTier', 'SpeechSynthesizer', 'SpellingChecker', 
        'Strings', 'StringsIndex', 'Table', 'TableOfReal', 'TextGrid', 'TextInterval', 
        'TextPoint', 'TextTier', 'Tier', 'Transition', 'VocalTract', 'VocalTractTier', 
        'Weight', 'WordList', 
    )
 
    variables_numeric = (
        'macintosh', 'windows', 'unix', 'praatVersion', 'pi', 'e', 'undefined', 
    )
 
    variables_string = (
        'praatVersion', 'tab', 'shellDirectory', 'homeDirectory', 
        'preferencesDirectory', 'newline', 'temporaryDirectory', 
        'defaultDirectory', 
    )
 
    object_attributes = (
        'ncol', 'nrow', 'xmin', 'ymin', 'xmax', 'ymax', 'nx', 'ny', 'dx', 'dy',
    )

    tokens = { 
        'root': [ 
            (r'(\s+)(#.*?$)',  bygroups(Text, Comment.Single)), 
            (r'^#.*?$',        Comment.Single), 
            (r';[^\n]*',       Comment.Single), 
            (r'\s+',           Text), 
 
            (r'\bprocedure\b', Keyword,       'procedure_definition'), 
            (r'\bcall\b',      Keyword,       'procedure_call'), 
            (r'@',             Name.Function, 'procedure_call'), 
 
            include('function_call'), 
 
            (words(keywords, suffix=r'\b'), Keyword), 
 
            (r'(\bform\b)(\s+)([^\n]+)', 
             bygroups(Keyword, Text, String), 'old_form'), 
 
            (r'(print(?:line|tab)?|echo|exit|asserterror|pause|send(?:praat|socket)|' 
             r'include|execute|system(?:_nocheck)?)(\s+)', 
             bygroups(Keyword, Text), 'string_unquoted'), 
 
            (r'(goto|label)(\s+)(\w+)', bygroups(Keyword, Text, Name.Label)), 
 
            include('variable_name'), 
            include('number'), 
 
            (r'"', String, 'string'), 
 
            (words((objects), suffix=r'(?=\s+\S+\n)'), Name.Class, 'string_unquoted'), 
 
            (r'\b[A-Z]', Keyword, 'command'), 
            (r'(\.{3}|[)(,])', Punctuation), 
        ], 
        'command': [ 
            (r'( ?[\w()-]+ ?)', Keyword), 

            include('string_interpolated'),

            (r'\.{3}', Keyword, ('#pop', 'old_arguments')), 
            (r':', Keyword, ('#pop', 'comma_list')), 
            (r'\s', Text, '#pop'),
        ], 
        'procedure_call': [ 
            (r'\s+', Text), 
            (r'([\w.]+)(:|\s*\()', 
             bygroups(Name.Function, Text), '#pop'), 
            (r'([\w.]+)', Name.Function, ('#pop', 'old_arguments')), 
        ], 
        'procedure_definition': [ 
            (r'\s', Text), 
            (r'([\w.]+)(\s*?[(:])', 
             bygroups(Name.Function, Text), '#pop'), 
            (r'([\w.]+)([^\n]*)', 
             bygroups(Name.Function, Text), '#pop'), 
        ], 
        'function_call': [ 
            (words(functions_string, suffix=r'\$(?=\s*[:(])'), Name.Function, 'function'), 
            (words(functions_array, suffix=r'#(?=\s*[:(])'),   Name.Function, 'function'),
            (words(functions_numeric, suffix=r'(?=\s*[:(])'),  Name.Function, 'function'),
        ], 
        'function': [ 
            (r'\s+',   Text), 
            (r':',     Punctuation, ('#pop', 'comma_list')), 
            (r'\s*\(', Punctuation, ('#pop', 'comma_list')), 
        ], 
        'comma_list': [ 
            (r'(\s*\n\s*)(\.{3})', bygroups(Text, Punctuation)), 
 
            (r'(\s*[])\n])', Text, '#pop'), 
 
            (r'\s+', Text), 
            (r'"',   String, 'string'), 
            (r'\b(if|then|else|fi|endif)\b', Keyword), 
 
            include('function_call'), 
            include('variable_name'), 
            include('operator'), 
            include('number'), 
 
            (r'[()]', Text),
            (r',', Punctuation), 
        ], 
        'old_arguments': [ 
            (r'\n', Text, '#pop'), 
 
            include('variable_name'), 
            include('operator'), 
            include('number'), 
 
            (r'"', String, 'string'), 
            (r'[^\n]', Text), 
        ], 
        'number': [ 
            (r'\n', Text, '#pop'),
            (r'\b\d+(\.\d*)?([eE][-+]?\d+)?%?', Number), 
        ], 
        'object_reference': [
            include('string_interpolated'),
            (r'([a-z][a-zA-Z0-9_]*|\d+)', Name.Builtin),

            (words(object_attributes, prefix=r'\.'), Name.Builtin, '#pop'),

            (r'\$', Name.Builtin),
            (r'\[', Text, '#pop'),
        ], 
        'variable_name': [ 
            include('operator'), 
            include('number'), 
 
            (words(variables_string,  suffix=r'\$'), Name.Variable.Global), 
            (words(variables_numeric,
             suffix=r'(?=[^a-zA-Z0-9_."\'$#\[:(]|\s|^|$)'),
             Name.Variable.Global),
 
            (words(objects, prefix=r'\b', suffix=r"(_)"),
             bygroups(Name.Builtin, Name.Builtin),
             'object_reference'),
 
            (r'\.?_?[a-z][\w.]*(\$|#)?', Text),
            (r'[\[\]]', Punctuation, 'comma_list'), 

            include('string_interpolated'),
        ], 
        'operator': [ 
            (r'([+\/*<>=!-]=?|[&*|][&*|]?|\^|<>)',       Operator),
            (r'(?<![\w.])(and|or|not|div|mod)(?![\w.])', Operator.Word),
        ], 
        'string_interpolated': [ 
            (r'\'[_a-z][^\[\]\'":]*(\[([\d,]+|"[\w,]+")\])?(:[0-9]+)?\'',
             String.Interpol), 
        ], 
        'string_unquoted': [ 
            (r'(\n\s*)(\.{3})', bygroups(Text, Punctuation)), 
 
            (r'\n',       Text,            '#pop'), 
            (r'\s',       Text), 

            include('string_interpolated'),

            (r"'",        String), 
            (r"[^'\n]+",  String), 
        ], 
        'string': [ 
            (r'(\n\s*)(\.{3})', bygroups(Text, Punctuation)), 
 
            (r'"',          String,          '#pop'), 

            include('string_interpolated'),

            (r"'",          String), 
            (r'[^\'"\n]+',  String), 
        ], 
        'old_form': [ 
            (r'(\s+)(#.*?$)',  bygroups(Text, Comment.Single)),
            (r'\s+', Text), 
 
            (r'(optionmenu|choice)([ \t]+\S+:[ \t]+)', 
             bygroups(Keyword, Text), 'number'), 
 
            (r'(option|button)([ \t]+)', 
             bygroups(Keyword, Text), 'string_unquoted'), 
 
            (r'(sentence|text)([ \t]+\S+)', 
             bygroups(Keyword, Text), 'string_unquoted'), 
 
            (r'(word)([ \t]+\S+[ \t]*)(\S+)?([ \t]+.*)?', 
             bygroups(Keyword, Text, String, Text)), 
 
            (r'(boolean)(\s+\S+\s*)(0|1|"?(?:yes|no)"?)', 
             bygroups(Keyword, Text, Name.Variable)), 
 
            # Ideally processing of the number would happend in the 'number' 
            # but that doesn't seem to work 
            (r'(real|natural|positive|integer)([ \t]+\S+[ \t]*)([+-]?)(\d+(?:\.\d*)?' 
             r'(?:[eE][-+]?\d+)?%?)', 
             bygroups(Keyword, Text, Operator, Number)), 
 
            (r'(comment)(\s+)', 
             bygroups(Keyword, Text), 'string_unquoted'), 
 
            (r'\bendform\b', Keyword, '#pop'), 
        ] 
    }