Permalink
Jan 14, 2015
Jan 14, 2015
Jan 1, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 14, 2015
Jan 1, 2015
Jan 1, 2015
Jan 1, 2015
Newer
100644
1628 lines (1457 sloc)
50.8 KB
9
__name__:'str',
10
$native:true
11
}
12
13
// str.__add__ : concatenation of "self" and "other".
// If "other" is not a native Javascript string, the result is delegated
// to its __radd__ method ; if the attribute lookup or the call fails,
// a TypeError is raised instead of the original error.
$StringDict.__add__ = function(self,other){
    if(typeof other!=="string"){
        try{return getattr(other,'__radd__')(self)}
        catch(err){throw _b_.TypeError(
            "Can't convert '"+$B.get_class(other).__name__+
            "' object to str implicitly")}
    }
    return self+other
}
21
22
$StringDict.__contains__ = function(self,item){
23
if(!(typeof item==="string")){throw _b_.TypeError(
24
"'in <string>' requires string as left operand, not "+item.__class__)}
25
var nbcar = item.length
26
if(nbcar==0) return true // a string contains the empty string
27
if(self.length==0) return nbcar==0
29
if(self.substr(i,nbcar)==item) return true
30
}
31
return false
32
}
33
34
// str.__delitem__ : item deletion is not supported, a TypeError is
// always raised
$StringDict.__delitem__ = function(){
    var exc = _b_.TypeError("'str' object doesn't support item deletion")
    throw exc
}
37
38
// __dir__ must be assigned explicitly because attribute resolution for builtin
39
// classes doesn't use __mro__
40
$StringDict.__dir__ = $ObjectDict.__dir__
41
42
$StringDict.__eq__ = function(self,other){
43
if(other===undefined){ // compare object "self" to class "str"
44
return self===str
45
}
46
if (_b_.isinstance(other, _b_.str)) {
47
return other.valueOf() == self.valueOf()
48
}
52
// Helper for str.__format__ : check the parsed format specification "fmt"
// against a string value.
// - if fmt.empty is set, return _b_.str(self)
// - if fmt.type is set and is not 's', raise ValueError
// - otherwise return self unchanged
function preformat(self, fmt){
    if(fmt.empty){return _b_.str(self)}
    if(fmt.type && fmt.type!='s'){
        throw _b_.ValueError("Unknown format code '"+fmt.type+
            "' for object of type 'str'")
    }
    return self
}
60
61
// str.__format__ : parse "format_spec" with $B.parse_format_spec, validate
// it with preformat() and let $B.format_width produce the result
$StringDict.__format__ = function(self, format_spec) {
    var spec = new $B.parse_format_spec(format_spec)
    // strings are left-aligned when no alignment is given
    if(!spec.align){spec.align = '<'}
    var text = preformat(self, spec)
    return $B.format_width(text, spec)
}
67
68
$StringDict.__getitem__ = function(self,arg){
69
if(isinstance(arg,_b_.int)){
70
var pos = arg
71
if(arg<0) pos+=self.length
72
if(pos>=0 && pos<self.length) return self.charAt(pos)
73
throw _b_.IndexError('string index out of range')
74
}
75
if(isinstance(arg,slice)) {
76
var step = arg.step===None ? 1 : arg.step
77
if(step>0){
78
var start = arg.start===None ? 0 : arg.start
79
var stop = arg.stop===None ? getattr(self,'__len__')() : arg.stop
80
}else{
81
var start = arg.start===None ? getattr(self,'__len__')()-1 : arg.start
86
var res = '',i=null
87
if(step>0){
88
if(stop<=start) return ''
89
for(var i=start;i<stop;i+=step) res += self.charAt(i)
90
} else {
91
if(stop>=start) return ''
93
}
94
return res
95
}
96
if(isinstance(arg,bool)) return self.__getitem__(_b_.int(arg))
101
if (self === undefined) {
102
return $StringDict.__hashvalue__ || $B.$py_next_hash-- // for hash of string type (not instance of string)
103
}
104
105
//http://stackoverflow.com/questions/2909106/python-whats-a-correct-and-good-way-to-implement-hash
106
// this implementation for strings maybe good enough for us..
107
108
var hash=1;
110
hash=(101*hash + self.charCodeAt(i)) & 0xFFFFFFFF
111
}
112
113
return hash
114
}
115
116
$StringDict.__init__ = function(self,arg){
117
self.valueOf = function(){return arg}
118
self.toString = function(){return arg}
120
}
121
122
// Class used for the iterators returned by str.__iter__
var $str_iterator = $B.$iterator_class('str_iterator')

// str.__iter__ : iterator on the elements of self.split('')
$StringDict.__iter__ = function(self){
    var chars = self.split('')
    return $B.$iterator(chars,$str_iterator)
}
127
128
// str.__len__ : value of the "length" attribute of the Javascript string
$StringDict.__len__ = function(self){
    var size = self.length
    return size
}
129
132
// Regular expression capturing, in group 1, the characters that precede
// the first ")" of the string it is applied to
var kwarg_key = new RegExp('([^\\)]*)\\)')
133
134
// Internal exception type ; instances are identified by their "name"
// attribute
var NotANumber = function() {
    var tag = 'NotANumber'
    this.name = tag
}
137
138
// Throw a NotANumber exception unless "s" is an instance of int or float ;
// returns nothing
var number_check=function(s) {
    var is_number = isinstance(s,[_b_.int,_b_.float])
    if(is_number){return}
    throw new NotANumber()
}
143
144
// Return a string made of "size" repetitions of "char".
// A size lower than or equal to 0 gives the empty string.
var get_char_array = function(size, char) {
    if (size <= 0) {
        return ''
    }
    // joining size+1 empty slots inserts the separator "size" times
    return new Array(size + 1).join(char)
}
149
150
// Pad "s" with flags.pad_char up to the width stored in flags.padding.
// - without flags.padding, s is returned unchanged (not converted)
// - minus_one : reserve one position, for numeric formatting where the
//   sign goes in front of the padding
// - flags.left : pad on the right instead of on the left
var format_padding = function(s, flags, minus_one) {
    if (!flags.padding) {return s}
    var text = s.toString(),
        width = parseInt(flags.padding, 10)
    if (minus_one) {width--}
    var fill = get_char_array(width - text.length, flags.pad_char)
    return flags.left ? text + fill : fill + text
}
167
168
// Convert the integer "val" to a string and, if flags.precision is set,
// left-pad its digits with zeros up to that number of digits.
// Instances of $B.LongInt are converted with to_base(val, 10), other
// values with toString().
var format_int_precision = function(val, flags) {
    var precision = flags.precision
    if (!precision) {
        return val.toString()
    }
    precision = parseInt(precision, 10)
    var s
    if (val.__class__ === $B.LongInt.$dict) {
        s=$B.LongInt.$dict.to_base(val, 10)
    } else {
        s=val.toString()
    }
    if (s[0] === '-') {
        // the sign is not counted in the precision and stays in front
        // of the zeros
        return '-' + get_char_array(precision - s.length + 1, '0') + s.slice(1)
    }
    return get_char_array(precision - s.length, '0') + s
}
186
187
// Format the float "val".
// Finite values are delegated to modifier(val, flags.precision, flags, upper) ;
// other values give 'inf', '-inf' or 'nan', in upper case if "upper" is set.
var format_float_precision = function(val, upper, flags, modifier) {
    if (isFinite(val)) {
        return modifier(val, flags.precision, flags, upper)
    }
    var text = val === Infinity ? 'inf' : (val === -Infinity ? '-inf' : 'nan')
    return upper ? text.toUpperCase() : text
}
207
208
// Return the prefix to put in front of a non-negative number :
// - "+" if flags.sign is set
// - " " if flags.space is set (and flags.sign is not)
// - "" in all the other cases, including negative values
var format_sign = function(val, flags) {
    if (flags.sign) {
        if (val >= 0) {
            return "+"
        }
    } else if (flags.space) {
        if (val >= 0) {
            return " "
        }
    }
    return ""
}
221
// Conversion of "val" with str() ; the result is padded with spaces,
// on the left or on the right
var str_format = function(val, flags) {
    // even if 0 padding is defined, don't use it
    flags.pad_char = " "
    var text = str(val)
    return format_padding(text, flags)
}
229
if (val.__class__ === $B.LongInt.$dict) {
230
val = $B.LongInt.$dict.to_base(val, 10)
231
} else {
232
val = parseInt(val)
233
}
234
235
var s = format_int_precision(val, flags)
236
if (flags.pad_char === '0') {
237
if (val < 0) {
238
s = s.substring(1)
239
return '-' + format_padding(s, flags, true)
240
}
241
var sign = format_sign(val, flags)
242
if (sign !== '') {
243
return sign + format_padding(s, flags, true)
244
}
245
}
246
247
return format_padding(format_sign(val, flags) + s, flags)
248
}
250
// Conversion of "val" with repr() ; the result is padded with spaces
var repr_format = function(val, flags) {
    // even if 0 padding is defined, don't use it
    flags.pad_char = " "
    var text = repr(val)
    return format_padding(text, flags)
}
255
// Conversion of "val" with ascii() ; the result is padded with spaces
var ascii_format = function(val, flags) {
    // even if 0 padding is defined, don't use it
    flags.pad_char = " "
    var text = ascii(val)
    return format_padding(text, flags)
}
260
// Check that "val" is a number, normalise flags.precision and return
// val converted to a float.
// - precision given : converted to an integer and validated
// - no precision : 6, or 0 if a decimal point was given without digits
var _float_helper = function(val, flags) {
    number_check(val)
    if (flags.precision) {
        flags.precision = parseInt(flags.precision, 10)
        validate_precision(flags.precision)
    } else {
        flags.precision = flags.decimal_point ? 0 : 6
    }
    return parseFloat(val)
}
276
// Patterns used when formatting floats :
// - trailing_zeros : captures the zeros that precede the exponent
// - leading_zeros : captures the zeros that follow the decimal point
// - trailing_dot : a dot at the end of the string
var trailing_zeros = /(.*?)(0+)([eE].*)/,
    leading_zeros = /\.(0*)/,
    trailing_dot = /\.$/
281
// Raise ValueError if "precision" is greater than 20 ; returns nothing
var validate_precision = function(precision) {
    // force precision to limits of javascript
    if (!(precision > 20)) {return}
    throw _b_.ValueError("precision too big")
}
287
288
// gG
289
var floating_point_format = function(val, upper, flags) {
290
val = _float_helper(val, flags)
291
var v = val.toString()
292
var v_len = v.length
293
var dot_idx = v.indexOf('.')
294
if (dot_idx < 0) {
295
dot_idx = v_len
296
}
297
if (val < 1 && val > -1) {
298
var zeros = leading_zeros.exec(v)
299
var numzeros
300
if (zeros) {
301
numzeros = zeros[1].length
302
} else {
303
numzeros = 0
304
}
305
if (numzeros >= 4) {
306
val = format_sign(val, flags) + format_float_precision(val, upper, flags, _floating_g_exp_helper)
307
if (!flags.alternate) {
308
var trl = trailing_zeros.exec(val)
309
if (trl) {
310
val = trl[1].replace(trailing_dot, '') + trl[3] // remove trailing
316
}
317
return format_padding(val, flags)
318
}
319
flags.precision += numzeros
320
return format_padding(format_sign(val, flags) + format_float_precision(val, upper, flags,
321
function(val, precision) {
322
val = val.toFixed(min(precision, v_len - dot_idx) + numzeros)
323
}), flags)
324
}
325
326
if (dot_idx > flags.precision) {
327
val = format_sign(val, flags) + format_float_precision(val, upper, flags, _floating_g_exp_helper)
328
if (!flags.alternate) {
329
var trl = trailing_zeros.exec(val)
330
if (trl) {
331
val = trl[1].replace(trailing_dot, '') + trl[3] // remove trailing
332
}
333
} else {
334
if (flags.precision <= 1) {
335
val = val[0] + '.' + val.substring(1)
336
}
337
}
338
return format_padding(val, flags)
339
}
340
return format_padding(format_sign(val, flags) + format_float_precision(val, upper, flags,
341
function(val, precision) {
342
if (!flags.decimal_point) {
343
precision = min(v_len - 1, 6)
344
} else if (precision > v_len) {
345
if (!flags.alternate) {
346
precision = v_len
348
}
349
if (precision < dot_idx) {
350
precision = dot_idx
351
}
352
return val.toFixed(precision - dot_idx)
353
}), flags)
354
}
356
// Exponent notation for the "g" and "G" formats : a non-zero precision is
// reduced by one before calling toExponential, then the exponent is
// padded to two digits. "flags" is not used ; "upper" selects upper case.
var _floating_g_exp_helper = function(val, precision, flags, upper) {
    var digits = precision
    if (digits) {digits = digits - 1}
    var text = val.toExponential(digits)
    // pad exponent to two digits
    var mark = text.lastIndexOf('e')
    if (text.length - mark < 4) {
        text = text.substring(0, mark + 2) + '0' + text.substring(mark + 2)
    }
    return upper ? text.toUpperCase() : text
}
371
372
// fF : fixed-point notation.
// "val" is converted by _float_helper (which also sets flags.precision),
// finite values are rendered with toFixed(precision), then the sign
// prefix and the padding are applied.
var floating_point_decimal_format = function(val, upper, flags) {
    val = _float_helper(val, flags)
    return format_padding(format_sign(val, flags) + format_float_precision(val, upper, flags,
        function(val, precision, flags) {
            val = val.toFixed(precision)
            if (precision === 0 && flags.alternate) {
                // "#" flag : keep the decimal point even without decimals
                val += '.'
            }
            return val
        }), flags)
}
384
385
// Exponent notation for the "e" and "E" formats : toExponential(precision)
// with the exponent padded to two digits. "flags" is not used ; "upper"
// selects upper case.
var _floating_exp_helper = function(val, precision, flags, upper) {
    var text = val.toExponential(precision)
    // pad exponent to two digits
    var mark = text.lastIndexOf('e')
    if (text.length - mark < 4) {
        text = text.substring(0, mark + 2) + '0' + text.substring(mark + 2)
    }
    return upper ? text.toUpperCase() : text
}
397
398
// eE : exponent notation.
// "val" is converted by _float_helper, rendered by _floating_exp_helper
// through format_float_precision, then the sign prefix and the padding
// are applied.
var floating_point_exponential_format = function(val, upper, flags) {
    var num = _float_helper(val, flags)
    var prefix = format_sign(num, flags)
    var digits = format_float_precision(num, upper, flags, _floating_exp_helper)
    return format_padding(prefix + digits, flags)
}
404
405
var signed_hex_format = function(val, upper, flags) {
408
409
if (val.__class__ === $B.LongInt.$dict) {
410
ret=$B.LongInt.$dict.to_base(val, 16)
411
} else {
412
ret = parseInt(val)
413
ret = ret.toString(16)
414
}
415
ret = format_int_precision(ret, flags)
416
if (upper) {
417
ret = ret.toUpperCase()
418
}
419
if (flags.pad_char === '0') {
420
if (val < 0) {
421
ret = ret.substring(1)
422
ret = '-' + format_padding(ret, flags, true)
423
}
424
var sign = format_sign(val, flags)
425
if (sign !== '') {
426
ret = sign + format_padding(ret, flags, true)
428
}
429
430
if (flags.alternate) {
431
if (ret.charAt(0) === '-') {
432
if (upper) {
433
ret = "-0X" + ret.slice(1)
434
} else {
435
ret = "-0x" + ret.slice(1)
436
}
437
} else {
438
if (upper) {
439
ret = "0X" + ret
440
} else {
441
ret = "0x" + ret
442
}
443
}
444
}
445
return format_padding(format_sign(val, flags) + ret, flags)
446
}
450
var ret
451
452
if (val.__class__ === $B.LongInt.$dict) {
453
ret = $B.LongInt.$dict.to_base(8)
454
} else {
455
ret = parseInt(val)
456
ret = ret.toString(8)
457
}
458
461
if (flags.pad_char === '0') {
462
if (val < 0) {
463
ret = ret.substring(1)
464
ret = '-' + format_padding(ret, flags, true)
465
}
466
var sign = format_sign(val, flags)
467
if (sign !== '') {
468
ret = sign + format_padding(ret, flags, true)
469
}
471
472
if (flags.alternate) {
473
if (ret.charAt(0) === '-') {
474
ret = "-0o" + ret.slice(1)
475
} else {
476
ret = "0o" + ret
477
}
479
return format_padding(ret, flags)
480
}
481
482
// %c : format a single character.
// - a string must hold exactly one character ; it is padded like any
//   other converted value
// - other values are converted with int() then chr()
// Raises TypeError('%c requires int or char') for longer or empty strings
// and for values that int() rejects.
var single_char_format = function(val, flags) {
    if(isinstance(val,str)){
        if(val.length!=1){throw _b_.TypeError('%c requires int or char')}
        return format_padding(val, flags)
    }
    try {
        val = _b_.int(val) // yes, floats are valid (they are cast to int)
    } catch (err) {
        throw _b_.TypeError('%c requires int or char')
    }
    return format_padding(chr(val), flags)
}
491
492
// Handle the digit "c" found in a format specification.
// - a "0" met before any width digit, decimal point or "-" flag selects
//   zero padding
// - otherwise the digit is appended to flags.padding (before the decimal
//   point) or to flags.precision (after it) ; both are kept as strings
var num_flag = function(c, flags) {
    var zero_pad = c === '0' && !flags.padding && !flags.decimal_point && !flags.left
    if (zero_pad) {
        flags.pad_char = '0'
        return
    }
    var target = flags.decimal_point ? 'precision' : 'padding'
    flags[target] = (flags[target] || "") + c
}
503
504
// Handle "." in a format specification : record it in flags.decimal_point.
// A second decimal point throws UnsupportedChar. "val" is not used.
var decimal_point_flag = function(val, flags) {
    if (!flags.decimal_point) {
        flags.decimal_point = true
        return
    }
    // can only have one decimal point
    throw new UnsupportedChar()
}
511
512
// Handlers of the flag characters of a format specification. They all
// receive (val, flags), ignore val and record the flag in "flags".

// "-" : left adjustment, always padded with spaces
var neg_flag = function(val, flags) {
    flags.left = true
    flags.pad_char = ' ' // overrides '0' flag
}

// " " : sets flags.space
var space_flag = function(val, flags) {
    flags['space'] = true
}

// "+" : sets flags.sign
var sign_flag = function(val, flags) {
    flags['sign'] = true
}

// "#" : sets flags.alternate
var alternate_flag = function(val, flags) {
    flags['alternate'] = true
}
528
530
's': str_format,
531
'd': num_format,
532
'i': num_format,
533
'u': num_format,
534
'o': octal_format,
535
'r': repr_format,
536
'a': ascii_format,
537
'g': function(val, flags) {return floating_point_format(val, false, flags)},
538
'G': function(val, flags) {return floating_point_format(val, true, flags)},
539
'f': function(val, flags) {return floating_point_decimal_format(val, false, flags)},
540
'F': function(val, flags) {return floating_point_decimal_format(val, true, flags)},
541
'e': function(val, flags) {return floating_point_exponential_format(val, false, flags)},
542
'E': function(val, flags) {return floating_point_exponential_format(val, true, flags)},
543
'x': function(val, flags) {return signed_hex_format(val, false, flags)},
544
'X': function(val, flags) {return signed_hex_format(val, true, flags)},
545
'c': single_char_format,
546
'0': function(val, flags) {return num_flag('0', flags)},
547
'1': function(val, flags) {return num_flag('1', flags)},
548
'2': function(val, flags) {return num_flag('2', flags)},
549
'3': function(val, flags) {return num_flag('3', flags)},
550
'4': function(val, flags) {return num_flag('4', flags)},
551
'5': function(val, flags) {return num_flag('5', flags)},
552
'6': function(val, flags) {return num_flag('6', flags)},
553
'7': function(val, flags) {return num_flag('7', flags)},
554
'8': function(val, flags) {return num_flag('8', flags)},
555
'9': function(val, flags) {return num_flag('9', flags)},
556
'-': neg_flag,
557
' ': space_flag,
558
'+': sign_flag,
559
'.': decimal_point_flag,
560
'#': alternate_flag
561
}
562
563
// exception thrown when an unsupported char is encountered in legacy format ;
// instances are identified by their "name" attribute
var UnsupportedChar = function() {
    var tag = "UnsupportedChar"
    this.name = tag
}
567
579
++pos
580
var rslt = kwarg_key.exec(s.substring(newpos))
581
if (!rslt) {
582
throw _b_.ValueError("incomplete format key")
583
}
584
var key = rslt[1]
585
newpos += rslt[0].length
586
try {
588
} catch(err) {
589
if (err.name === "KeyError") {
590
throw err
591
}
592
throw _b_.TypeError("format requires a mapping")
593
}
608
}
609
catch(err) {
610
if (err.name === "IndexError") {
611
throw _b_.TypeError("not enough arguments for format string")
612
} else {
613
throw err
614
}
620
// todo: get flags, type
621
// todo: string value based on flags, type, value
622
var flags = {'pad_char': ' '}
623
do {
630
if (ret !== undefined) {
631
return ret
632
}
633
++newpos
634
}
635
} catch (err) {
636
if (err.name === "UnsupportedChar") {
637
invalid_char = s[newpos]
638
if (invalid_char === undefined) {
639
throw _b_.ValueError("incomplete format")
640
}
641
throw _b_.ValueError("unsupported format character '" + invalid_char +
642
"' (0x" + invalid_char.charCodeAt(0).toString(16) + ") at index " + newpos)
643
} else if (err.name === "NotANumber") {
644
var try_char = s[newpos]
651
}
652
} else {
653
cls = cls.__name__
654
}
655
throw _b_.TypeError("%" + try_char + " format: a number is required, not " + cls)
656
} else {
657
throw err
658
}
680
}
681
}
682
} else {
683
// % at end of string
684
throw _b_.ValueError("incomplete format")
685
}
686
pos = newpos + 1
687
} while (pos < length)
688
691
692
// Method resolution order of str : $StringDict itself, then $ObjectDict
$StringDict.__mro__ = [$StringDict,$ObjectDict]
693
694
// str.__mul__ : return "self" repeated "other" times.
// Raises TypeError if "other" is not an int ; a null or negative count
// gives the empty string.
$StringDict.__mul__ = function(self,other){
    if(!isinstance(other,_b_.int)){throw _b_.TypeError(
        "Can't multiply sequence by non-int of type '"+
            $B.get_class(other).__name__+"'")}
    // the accumulator is local : it used to leak as the global $res
    var res = '', text = self.valueOf()
    for(var i=0;i<other;i++){res+=text}
    return res
}
702
703
// str.__ne__ : true unless "other" is strictly equal to the value of self
$StringDict.__ne__ = function(self,other){
    var same = other===self.valueOf()
    return !same
}
704
705
$StringDict.__repr__ = function(self){
706
var res = self.replace(/\n/g,'\\\\n')
707
// escape the escape char
708
res = res.replace(/\\/g, '\\\\')
709
if(res.search('"')==-1 && res.search("'")==-1){
710
return "'"+res+"'"
719
// str.__setattr__ : delegates to setattr() and returns its result
$StringDict.__setattr__ = function(self,attr,value){
    var res = setattr(self,attr,value)
    return res
}
720
721
// str.__setitem__ : item assignment is not supported, a TypeError is
// always raised
$StringDict.__setitem__ = function(self,attr,value){
    var exc = _b_.TypeError("'str' object does not support item assignment")
    throw exc
}
724
// str.__str__ : called without argument, gives the representation of the
// class ; otherwise the string itself
$StringDict.__str__ = function(self){
    return self===undefined ? "<class 'str'>" : self.toString()
}
728
// Javascript string conversion of the $StringDict object itself ; always
// returns the fixed text 'string!'
$StringDict.toString = function(){return 'string!'}
729
730
// generate comparison methods __gt__, __ge__, __lt__ and __le__
// Each method raises TypeError if "other" is not a native Javascript
// string, otherwise returns the result of the Javascript comparison.
// The methods are built with closures instead of eval() on a rewritten
// function source.
var $comps = {'>':'gt','>=':'ge','<':'lt','<=':'le'}
var $comp_tests = {
    '>': function(a,b){return a > b},
    '>=': function(a,b){return a >= b},
    '<': function(a,b){return a < b},
    '<=': function(a,b){return a <= b}
}
var $make_comp_func = function(op){
    var test = $comp_tests[op]
    return function(self,other){
        if(typeof other !=="string"){throw _b_.TypeError(
            "unorderable types: 'str' "+op+" "+
                $B.get_class(other).__name__+"()")}
        return test(self,other)
    }
}
// kept for compatibility : implementation of the ">" comparison
var $comp_func = $make_comp_func('>')
for(var $op in $comps){
    $StringDict["__"+$comps[$op]+"__"] = $make_comp_func($op)
}
741
742
// add "reflected" methods
743
$B.make_rmethods($StringDict)
744
745
// unsupported operations
// Template of a binary method that always raises NotImplementedError ;
// the exception is taken from _b_ like the other exceptions of this file
var $notimplemented = function(self,other){
    throw _b_.NotImplementedError("OPERATOR not implemented for class str")
}
749
750
// str.capitalize : first character in upper case, all the others in
// lower case ; the empty string is returned unchanged
$StringDict.capitalize = function(self){
    if(self.length==0){return ''}
    var head = self.charAt(0),
        tail = self.slice(1)
    return head.toUpperCase()+tail.toLowerCase()
}
754
755
// str.casefold : not implemented, always raises NotImplementedError
$StringDict.casefold = function(self) {
    var message = "function casefold not implemented yet"
    throw _b_.NotImplementedError(message)
}
758
759
// str.center : return "self" centered in a string of length "width",
// padded with "fillchar" (a space by default).
// If width is not greater than the length of self, self is returned.
// When the padding cannot be split evenly, the extra character is placed
// with the same rule as CPython : on the left when both the padding and
// the width are odd, on the right otherwise.
$StringDict.center = function(self,width,fillchar){
    if(fillchar===undefined){fillchar=' '}
    if(width<=self.length) return self

    var total = width-self.length
    var left = Math.floor(total/2) + (total & width & 1)
    var right = total-left
    return Array(left+1).join(fillchar)+self+Array(right+1).join(fillchar)
}
769
770
$StringDict.count = function(){
771
var $ = $B.args('count', 4, {self:null, sub:null, start:null, stop:null},
772
['self', 'sub', 'start', 'stop'], arguments, {start:0, stop:null},
773
null, null)
774
if(!(typeof $.sub==="string")){throw _b_.TypeError(
775
"Can't convert '"+$.sub.__class__.__name__+"' object to str implicitly")}
777
var n=0, pos=$.start
778
if($.stop===null){$.stop=$.self.length}
779
while(pos<$.stop){
780
pos=$.self.indexOf($.sub,pos)
781
if(pos>=0){ n++; pos+=$.sub.length} else break;
782
}
783
return n
784
}
785
786
$StringDict.encode = function(self, encoding) {
787
if (encoding === undefined) encoding='utf-8'
788
if(encoding=='rot13' || encoding=='rot_13'){
789
// Special case : returns a string
790
var res = ''
791
for(var i=0, _len = self.length; i<_len ; i++){
792
var char = self.charAt(i)
793
if(('a'<=char && char<='m') || ('A'<=char && char<='M')){
794
res += String.fromCharCode(String.charCodeAt(char)+13)
795
}else if(('m'<char && char<='z') || ('M'<char && char<='Z')){
796
res += String.fromCharCode(String.charCodeAt(char)-13)
797
}else{res += char}
798
}
799
return res
800
}
802
}
803
804
$StringDict.endswith = function(self){
805
// Return True if the string ends with the specified suffix, otherwise
806
// return False. suffix can also be a tuple of suffixes to look for.
807
// With optional start, test beginning at that position. With optional
808
// end, stop comparing at that position.
810
{self:null, suffix:null, start:null, end:null},
811
['self', 'suffix', 'start', 'end'],
812
arguments,{start:0, end:self.length-1},null,null)
813
var suffixes = $ns['suffix']
814
if(!isinstance(suffixes,_b_.tuple)){suffixes=[suffixes]}
819
suffix = suffixes[i]
820
if(suffix.length<=s.length &&
821
s.substr(s.length-suffix.length)==suffix) return true
822
}
823
return false
824
}
825
826
// str.expandtabs : replace each tab by the number of spaces needed to
// reach the next multiple of "tabsize" (8 by default).
// The current column is reset after "\n" and "\r". With a tabsize lower
// than or equal to 0, tabs are removed.
$StringDict.expandtabs = function(self, tabsize) {
    if(tabsize===undefined){tabsize=8}
    var src = self.valueOf(), res = '', col = 0
    for(var i=0;i<src.length;i++){
        var car = src.charAt(i)
        if(car=='\t'){
            if(tabsize>0){
                var nb = tabsize-(col % tabsize)
                res += Array(nb+1).join(' ')
                col += nb
            }
        }else{
            res += car
            col = (car=='\n' || car=='\r') ? 0 : col+1
        }
    }
    return res
}
832
833
$StringDict.find = function(self){
834
// Return the lowest index in the string where substring sub is found,
835
// such that sub is contained in the slice s[start:end]. Optional
836
// arguments start and end are interpreted as in slice notation.
837
// Return -1 if sub is not found.
838
var start=0,end=self.length
840
{self:null, sub:null, start:null, end:null},
841
['self', 'sub', 'start','end'],
842
arguments,{start:0, end:self.length},null,null)
843
for(var attr in $ns){eval('var '+attr+'=$ns[attr]')}
844
if(!isinstance(sub,str)){throw _b_.TypeError(
845
"Can't convert '"+sub.__class__.__name__+"' object to str implicitly")}
846
if(!isinstance(start,_b_.int)||!isinstance(end,_b_.int)){
847
throw _b_.TypeError(
848
"slice indices must be integers or None or have an __index__ method")}
849
var s = self.substring(start,end)
850
var esc_sub = ''
852
switch(sub.charAt(i)) {
853
case '[':
854
case '.':
855
case '*':
856
case '+':
857
case '?':
858
case '|':
859
case '(':
860
case ')':
861
case '$':
862
case '^':
863
esc_sub += '\\'
864
}
865
esc_sub += sub.charAt(i)
866
}
867
var res = s.search(esc_sub)
868
if(res==-1) return -1
869
return start+res
870
}
871
876
// Parse a "format string", as described in the Python documentation
877
// Return a format object. For the format string
878
// a.x[z]!r:...
879
// the object has attributes :
880
// - name : "a"
881
// - name_ext : [".x", "[z]"]
882
// - conv : r
883
// - spec : rest of string after :
885
var elts = fmt_string.split(':'), name, conv, spec, name_ext=[]
886
if(elts.length==1){
887
// No : in the string : it only contains a name
888
name = fmt_string
889
}else{
890
// name is before the first ":"
891
// spec (the format specification) is after
892
name = elts[0]
893
spec = elts.splice(1).join(':')
894
}
895
896
var elts = name.split('!')
897
if(elts.length>1){
898
name=elts[0]
899
conv=elts[1] // conversion flag
900
if(conv.length!==1 || 'ras'.search(conv)==-1){
901
throw _b_.ValueError('wrong conversion flag '+conv)
902
}
903
}
905
if(name!==undefined){
906
// "name' may be a subscription or attribute
907
// Put these "extensions" in the list "name_ext"
908
function name_repl(match){
909
name_ext.push(match)
910
return ''
911
}
912
var name_ext_re = /\.[_a-zA-Z][_a-zA-Z0-9]*|\[[_a-zA-Z][_a-zA-Z0-9]*\]|\[[0-9]+\]/g
913
name = name.replace(name_ext_re, name_repl)
914
}
923
arguments, {}, 'args', 'kw')
924
925
// Parse self to detect formatting instructions
926
// Create a list "parts" made of sections of the string :
927
// - elements of even rank are literal text
928
// - elements of odd rank are "format objects", built from the
929
// format strings in self (of the form {...})
930
var pos=0, _len=self.length, car, text='', parts=[], rank=0, defaults={}
931
932
while(pos<_len){
933
car = self.charAt(pos)
934
if(car=='{' && self.charAt(pos+1)=='{'){
935
// replace {{ by literal {
936
text += '{'
937
pos+=2
938
}else if(car=='}' && self.charAt(pos+1)=='}'){
939
// replace }} by literal }
940
text += '}'
941
pos+=2
942
}else if(car=='{'){
943
// Start of a format string
944
945
// Store current literal text
946
parts.push(text)
947
948
// Search the end of the format string, ie the } closing the
949
// opening {. Since the string can contain other pairs {} for
950
// nested formatting, an integer nb is incremented for each { and
951
// decremented for each } ; the end of the format string is
952
// reached when nb==0
953
var end = pos+1, nb=1
954
while(end<_len){
955
if(self.charAt(end)=='{'){nb++;end++}
956
else if(self.charAt(end)=='}'){
957
nb--;end++
958
if(nb==0){
959
// End of format string
960
var fmt_string = self.substring(pos+1, end-1)
961
962
// Create a format object, by function parse_format
963
var fmt_obj = parse_format(fmt_string)
964
965
// If no name is explicitely provided, use the rank
966
if(!fmt_obj.name){
967
fmt_obj.name=rank+''
968
rank++
969
}
972
// "spec" may contain "nested replacement fields"
973
// In this case, evaluate them using the keyword
974
// arguments passed to format()
975
function replace_nested(name, key){
978
}
979
fmt_obj.spec = fmt_obj.spec.replace(/\{(.+?)\}/g,
980
replace_nested)
981
}
982
983
// Store format object in list "parts"
984
parts.push(fmt_obj)
985
text = ''
986
break
987
}
988
}else{end++}
990
if(nb>0){throw ValueError("wrong format "+self)}
991
pos = end
992
}else{text += car;pos++}
996
// Apply formatting to the values passed to format()
997
var res = '', fmt
998
for(var i=0;i<parts.length;i++){
999
// Literal text is added unchanged
1000
if(typeof parts[i]=='string'){res += parts[i];continue}
1001
1002
// Format objects
1003
fmt = parts[i]
1004
if(fmt.name.charAt(0).search(/\d/)>-1){
1005
// Numerical reference : use positional arguments
1006
var pos = parseInt(fmt.name),
1007
value = _b_.tuple.$dict.__getitem__($.args, pos)
1008
}else{
1009
// Use keyword arguments
1010
var value = _b_.dict.$dict.__getitem__($.kw, fmt.name)
1011
}
1012
// If name has extensions (attributes or subscriptions)
1013
for(var j=0;j<fmt.name_ext.length;j++){
1014
var ext = fmt.name_ext[j]
1015
if(ext.charAt(0)=='.'){
1016
// Attribute
1017
value = _b_.getattr(value, ext.substr(1))
1018
}else{
1019
// Subscription
1020
var key = ext.substr(1, ext.length-2)
1021
// An index made of digits is transformed into an integer
1022
if(key.charAt(0).search(/\d/)>-1){key = parseInt(key)}
1023
value = _b_.getattr(value, '__getitem__')(key)
1024
}
1025
}
1026
// If the conversion flag is set, first call a function to convert
1027
// the value
1028
if(fmt.conv=='a'){value = _b_.ascii(value)}
1029
else if(fmt.conv=='r'){value = _b_.repr(value)}
1030
else if(fmt.conv=='s'){value = _b_.str(value)}
1031
1032
// Call attribute __format__ to perform the actual formatting
1033
res += _b_.getattr(value, '__format__')(fmt.spec)
1036
}
1037
1038
// str.format_map : not implemented, always raises NotImplementedError
// (taken from _b_, as in str.casefold)
$StringDict.format_map = function(self) {
    throw _b_.NotImplementedError("function format_map not implemented yet")
}
1041
1042
// str.index : same arguments and result as str.find, except that
// ValueError is raised when find returns -1
$StringDict.index = function(self){
    var pos = $StringDict.find.apply(self,arguments)
    if(pos!==-1){return pos}
    throw _b_.ValueError("substring not found")
}
1048
1049
// str.isalnum : true if the string is not empty and only made of ASCII
// letters and digits
$StringDict.isalnum = function(self) {
    var alnum_only = /^[a-z0-9]+$/i
    return alnum_only.test(self)
}
1050
1051
// str.isalpha : true if the string is not empty and only made of ASCII
// letters
$StringDict.isalpha = function(self) {
    var letters_only = /^[a-z]+$/i
    return letters_only.test(self)
}
1052
1053
// str.isdecimal : true if the string is not empty and only made of the
// digits 0 to 9
$StringDict.isdecimal = function(self) {
    // this is not 100% correct
    var digits_only = /^[0-9]+$/
    return digits_only.test(self)
}
1057
1058
// str.isdigit : true if the string is not empty and only made of the
// digits 0 to 9
$StringDict.isdigit = function(self) {
    var digits_only = /^[0-9]+$/
    return digits_only.test(self)
}
1059
1060
// str.isidentifier : true if the string is a valid identifier, ie an
// ASCII letter or underscore followed by any number of ASCII letters,
// digits or underscores.
// Reserved words (False, None, def, yield...) give true, as before : they
// all match the pattern, so no specific test is needed.
$StringDict.isidentifier = function(self) {
    // fixme.. this isn't complete (no support of non-ASCII identifiers)
    return /^[a-z_][0-9a-z_]*$/i.test(self)
}
1102
1104
1105
// not sure how to handle unicode variables
// str.isnumeric : true if the string is not empty and only made of the
// digits 0 to 9
$StringDict.isnumeric = function(self) {
    var digits_only = /^[0-9]+$/
    return digits_only.test(self)
}
1107
1108
// inspired by http://www.codingforums.com/archive/index.php/t-17925.html
// str.isprintable : true if no character is outside the range from
// space to "~" ; the empty string gives true
$StringDict.isprintable = function(self) {
    var has_other = /[^ -~]/.test(self)
    return !has_other
}
1110
1111
// str.isspace : true if the string is not empty and only made of
// characters matched by \s
$StringDict.isspace = function(self) {
    var blank_only = /^\s+$/i
    return blank_only.test(self)
}
1112
1113
// str.istitle : true if the string has at least one cased character and
// is titlecased, ie upper case characters only follow uncased characters
// and lower case characters only follow cased ones.
// A character is considered cased if toUpperCase() or toLowerCase()
// changes it.
$StringDict.istitle = function(self) {
    var cased = false, prev_cased = false
    for(var i=0;i<self.length;i++){
        var car = self.charAt(i),
            is_upper = car!=car.toLowerCase(),
            is_lower = !is_upper && car!=car.toUpperCase()
        if(is_upper){
            // an upper case character must start a word
            if(prev_cased){return false}
            prev_cased = true
            cased = true
        }else if(is_lower){
            // a lower case character can't start a word
            if(!prev_cased){return false}
            prev_cased = true
            cased = true
        }else{
            prev_cased = false
        }
    }
    return cased
}
1114
1116
1117
$StringDict.join = function(self,obj){
1118
var iterable=iter(obj)
1119
var res = '',count=0
1120
while(1){
1121
try{
1122
var obj2 = next(iterable)
1123
if(!isinstance(obj2,str)){throw _b_.TypeError(
1124
"sequence item "+count+": expected str instance, "+$B.get_class(obj2).__name__+" found")}
1125
res += obj2+self
1126
count++
1127
}catch(err){
1129
else{throw err}
1130
}
1131
}
1132
if(count==0) return ''
1133
return res.substr(0,res.length-self.length)
1134
}
1135
1136
// str.ljust : return "self" left-justified in a string of length "width",
// completed on the right with "fillchar" (a space by default).
// If width is not greater than the length of self, self is returned.
$StringDict.ljust = function(self, width, fillchar) {
    var missing = width - self.length
    if (missing <= 0) {return self}
    var filler = fillchar === undefined ? ' ' : fillchar
    return self + Array(missing + 1).join(filler)
}
1141
1142
// str.lower : result of the Javascript method toLowerCase()
$StringDict.lower = function(self){
    var lowered = self.toLowerCase()
    return lowered
}
1143
1144
// str.lstrip : return "self" without its leading characters.
// - without "x", leading whitespace is removed
// - otherwise all the leading characters found in the string "x" are
//   removed. The characters are compared literally : they are no longer
//   interpolated in a regular expression, where "]", "^", "-" or "\"
//   had a special meaning.
$StringDict.lstrip = function(self,x){
    if(x==undefined){return self.replace(/^\s*/,"")}
    var pos = 0
    while(pos<self.length && x.indexOf(self.charAt(pos))>-1){pos++}
    return self.substr(pos)
}
1151
1152
// note, maketrans should be a static function.
1153
$StringDict.maketrans = function(from, to) {
1154
var _t=[]
1155
// make 'default' translate table
1156
for(var i=0; i < 256; i++) _t[i]=String.fromCharCode(i)
1157
1158
// make substitution in the translation table
1160
var _ndx=from.source[i].charCodeAt(0) //retrieve ascii code of char
1161
_t[_ndx]=to.source[i]
1162
}
1163
1164
// create a data structure that string.translate understands
1168
}
1169
return _d
1170
}
1171
1172
// str.partition : split "self" at the first occurrence of "sep".
// Returns the tuple (part before sep, sep, part after sep), or
// (self, '', '') if sep is not found.
// Throws an Error if sep is missing and raises ValueError if sep is
// empty.
$StringDict.partition = function(self,sep) {
    if (sep === undefined) {
        throw Error("sep argument is required")
    }
    if (sep.length === 0) {
        throw _b_.ValueError("empty separator")
    }
    var i=self.indexOf(sep)
    if (i== -1) return _b_.tuple([self, '', ''])
    return _b_.tuple([self.substring(0,i), sep, self.substring(i+sep.length)])
}
1181
1182
function $re_escape(str)
1183
{
1184
var specials = "[.*+?|()$^"
1186
var re = new RegExp('\\'+specials.charAt(i),'g')
1187
str = str.replace(re, "\\"+specials.charAt(i))
1188
}
1189
return str
1190
}
1191
1192
// str.replace(old, new[, count]): return a copy of the string with
// occurrences of 'old' replaced by '_new'.
//   self  : the source string
//   old   : substring to look for
//   _new  : replacement text
//   count : maximum number of replacements; in CPython, negative or undefined
//           values of count mean replace all
// Throws TypeError when count is neither an int nor a float, or is a float.
$StringDict.replace = function(self, old, _new, count) {
    if (count === undefined) {
        count = -1;
    } else {
        // Validate instance type of 'count'
        if (!isinstance(count,[_b_.int,_b_.float])) {
            throw _b_.TypeError("'" + str(count.__class__) + "' object cannot be interpreted as an integer");
        } else if (isinstance(count, _b_.float)) {
            throw _b_.TypeError("integer argument expected, got float");
        }
    }

    var res = self.valueOf();
    // There are at most length+1 places where a replacement can happen (the
    // +1 is for an empty 'old', which also matches at the end of the string)
    var remaining = count < 0 ? res.length + 1 : count;

    if (old.length === 0) {
        // An empty pattern matches before every character and at the end:
        // "abc".replace("", "-") is "-a-b-c-"
        var pieces = [], i = 0;
        while (i < res.length && remaining > 0) {
            pieces.push(_new, res.charAt(i));
            i++;
            remaining--;
        }
        if (i === res.length && remaining > 0) {
            pieces.push(_new);
        } else {
            pieces.push(res.substr(i));
        }
        return pieces.join('');
    }

    var pos = 0;
    while (remaining > 0) {
        pos = res.indexOf(old, pos);
        if (pos < 0) break;
        res = res.substr(0, pos) + _new + res.substr(pos + old.length);
        // resume after the inserted text so that it is never rescanned
        pos = pos + _new.length;
        remaining--;
    }
    return res;
}
1220
1221
// str.rfind(sub[, start[, end]])
// NOTE(review): the line that opens the argument-parsing call (and declares
// `$ns`) is not present in this copy of the file; only its trailing arguments
// are visible below.
$StringDict.rfind = function(self){
1222
// Return the highest index in the string where substring sub is found,
1223
// such that sub is contained within s[start:end]. Optional arguments
1224
// start and end are interpreted as in slice notation. Return -1 on failure.
1226
{self:null, sub:null, start:null, end:null},
1227
['self', 'sub', 'start', 'end'],
1228
arguments,{start:0, end:self.length},null,null)
1229
// copy every parsed argument of $ns into a local variable of the same name
for(var attr in $ns){eval('var '+attr+'=$ns[attr]')}
1230
if(!isinstance(sub,str)){throw _b_.TypeError(
1231
"Can't convert '"+sub.__class__.__name__+"' object to str implicitly")}
1232
if(!isinstance(start,_b_.int)||!isinstance(end,_b_.int)){throw _b_.TypeError(
1233
"slice indices must be integers or None or have an __index__ method")}
1234
1235
// NOTE(review): `s` is computed but never used; the search below runs on the
// whole of `self`, so `start` and `end` do not restrict the result.
var s = self.substring(start,end)
1236
1237
// why not use lastIndexOf, which passes all brython tests..?
1238
return self.lastIndexOf(sub)
1239
}
1240
1241
// str.rindex(sub[, start[, end]]): same lookup as rfind(), but a substring
// that cannot be found is reported with a ValueError instead of -1.
$StringDict.rindex = function(){
    var position = $StringDict.rfind.apply(this,arguments)
    if(position != -1){return position}
    throw _b_.ValueError("substring not found")
}
1247
1248
// str.rjust(width[, fillchar]): return the string right-justified in a field
// of `width` characters, padded on the left with `fillchar` (a space by
// default).
// NOTE(review): the line that opens the argument-parsing call (and declares
// `$ns`) is not present in this copy of the file; only its trailing arguments
// are visible below.
$StringDict.rjust = function(self) {
1250
{self:null, width:null, fillchar:null},
1251
['self', 'width', 'fillchar'],
1252
arguments,{fillchar:' '},null,null)
1253
// copy every parsed argument of $ns into a local variable of the same name
for(var attr in $ns){eval('var '+attr+'=$ns[attr]')}
1254
1255
// nothing to pad when the string already fills the field
if (width <= self.length) return self
1256
1257
// joining an array of n+1 empty slots with fillchar yields n copies of it
return Array(width - self.length + 1).join(fillchar) + self
1258
}
1259
1260
// str.rpartition(sep): split the string at the last occurrence of sep.
//   self : the string to split
//   sep  : the separator (required, must not be empty)
// Returns a 3-item tuple (head, sep, tail). When sep is not found the tuple is
// ('', '', self).
// Throws TypeError when sep is missing and ValueError when sep is empty, as
// CPython does.
$StringDict.rpartition = function(self,sep) {
    if (sep === undefined) {
        throw _b_.TypeError("rpartition() takes exactly one argument (0 given)")
    }
    if (sep.length === 0) {
        throw _b_.ValueError("empty separator")
    }
    var pos = self.lastIndexOf(sep)
    if (pos === -1) return _b_.tuple(['', '', self])
    return _b_.tuple([self.substring(0,pos), sep, self.substring(pos+sep.length)])
}
1275
1276
// str.rsplit([sep[, maxsplit]]): split the string, keeping at most `maxsplit`
// splits counted from the right.
// NOTE(review): the statements that build `$ns` and the `array` of pieces are
// not present in this copy of the file.
$StringDict.rsplit = function(self) {
1277
var args = [], pos=0
1278
// collect every argument after `self`
for(var i=1,_len_i=arguments.length;i<_len_i;i++){args[pos++]=arguments[i]}
1280
var sep=None,maxsplit=-1
1281
if($ns['args'].length>=1){sep=$ns['args'][0]}
1282
if($ns['args'].length==2){maxsplit=$ns['args'][1]}
1289
// no limit, or fewer pieces than the limit : return every piece
if (array.length <= maxsplit || maxsplit == -1) return array
1290
1291
var s=[]
1292
1293
// keep the last `maxsplit` pieces as they are ...
s = array.splice(array.length - maxsplit, array.length)
1294
// ... and glue the remaining leading pieces back together as the first item
s.splice(0, 0, array.join(sep))
1295
1296
return s
1297
}
1298
1299
// str.rstrip([chars]): return a copy of the string with trailing characters
// removed.
//   self : the string to strip
//   x    : set of characters to remove; when omitted, trailing whitespace is
//          removed
// The characters of x are escaped before being placed in a regular expression
// character class, so that '^', ']', '-' and '\' are stripped literally
// instead of being read as class syntax.
// strip() in this file forwards the literal value "\\s" to ask for whitespace
// stripping, so that exact value is still treated as "whitespace".
$StringDict.rstrip = function(self,x){
    var pattern
    if(x==undefined || x==="\\s"){
        pattern = "\\s*"
    }else{
        pattern = "["+String(x).replace(/[\\\]\^\-]/g, "\\$&")+"]*"
    }
    // declared locally : the regular expression must not leak into the global scope
    var sp = new RegExp(pattern+'$')
    // String.replace already returns a plain Javascript string
    return self.replace(sp,"")
}
1305
1306
// str.split([sep[, maxsplit]]): return the list of pieces of the string.
// Without a separator the string is split on runs of whitespace; otherwise it
// is split on the literal separator through a regular expression.
// NOTE(review): several original lines are not present in this copy of the
// file (the statement building `$ns`, the head of the loop and switch that
// escape the separator, and the statements computing `a` and `b`), which is
// why the braces below do not balance.
$StringDict.split = function(self){
1307
var args = [], pos=0
1308
// collect every argument after `self`
for(var i=1,_len_i=arguments.length;i<_len_i;i++){args[pos++]=arguments[i]}
1310
var sep=None,maxsplit=-1
1311
if($ns['args'].length>=1){sep=$ns['args'][0]}
1312
if($ns['args'].length==2){maxsplit=$ns['args'][1]}
1313
// a keyword argument "maxsplit" overrides the positional value
maxsplit = _b_.dict.$dict.get($ns['kw'],'maxsplit',maxsplit)
1315
if(sep===None){
1316
var res = []
1317
var pos = 0
1318
// skip leading whitespace
while(pos<self.length&&self.charAt(pos).search(/\s/)>-1){pos++}
1320
// `name` accumulates the characters of the word being read
var name = ''
1321
while(1){
1322
if(self.charAt(pos).search(/\s/)===-1){
1323
if(name===''){name=self.charAt(pos)}
1324
else{name+=self.charAt(pos)}
1325
}else{
1326
// whitespace ends the current word, if any
if(name!==''){
1327
res.push(name)
1328
if(maxsplit!==-1&&res.length===maxsplit+1){
1329
// limit reached : the last item becomes this word followed by
// everything from the current position to the end of the string
res.pop()
1330
res.push(name+self.substr(pos))
1331
return res
1332
}
1333
name=''
1334
}
1335
}
1336
pos++
1337
if(pos>self.length-1){
1338
// end of string : flush the word being read
if(name){res.push(name)}
1339
break
1340
}
1341
}
1342
return res
1343
}else{
1344
// build a regular expression source matching `sep` literally
var esc_sep = ''
1349
// NOTE(review): the visible cases escape . [ ] ( ) | $ ^ ; whether other
// metacharacters (* + ? \ {) are handled by the missing lines cannot be
// determined from here.
case '.':
1350
case '[':
1351
case ']':
1352
case '(':
1353
case ')':
1354
case '|':
1355
case '$':
1356
case '^':
1357
esc_sep += '\\'
1358
}
1359
esc_sep += sep.charAt(i)
1360
}
1361
var re = new RegExp(esc_sep)
1362
if (maxsplit==-1){
1363
// use native Javascript split on self
1364
return self.valueOf().split(re,maxsplit)
1365
}
1366
1367
// javascript split behavior is different from python when
1368
// a maxsplit argument is supplied. (see javascript string split
1369
// function docs for details)
1370
var l=self.valueOf().split(re,-1)
1373
// the pieces beyond the limit are joined back with the separator
if (b.length > 0) a.push(b.join(sep))
1374
1375
return a
1376
}
1377
}
1378
1379
// str.splitlines([keepends]): return the list of the lines of the string,
// breaking at line boundaries.
//   self     : the string to split
//   keepends : when true, the line break is kept at the end of each line
// As in CPython, "\r\n" counts as a single boundary, a trailing line break
// does not produce a final empty line, and the empty string gives an empty
// list.
$StringDict.splitlines = function(self, keepends){
    var text = self.valueOf(),
        lines = [],
        start = 0,
        boundary = /\r\n|[\n\r\v\f\x1c\x1d\x1e\x85\u2028\u2029]/g,
        match
    while((match = boundary.exec(text)) !== null){
        var stop = keepends ? boundary.lastIndex : match.index
        lines.push(text.substring(start, stop))
        start = boundary.lastIndex
    }
    // text after the last line break, if any
    if(start < text.length){lines.push(text.substring(start))}
    return lines
}
1380
1381
// str.startswith(prefix[, start[, end]])
// NOTE(review): the line that opens the argument-parsing call (and declares
// `$ns`), the statements deriving `s` and the header of the loop over the
// prefixes are not present in this copy of the file.
$StringDict.startswith = function(self){
1382
// Return True if string starts with the prefix, otherwise return False.
1383
// prefix can also be a tuple of prefixes to look for. With optional
1384
// start, test string beginning at that position. With optional end,
1385
// stop comparing string at that position.
1387
{self:null, prefix:null, start:null, end:null},
1388
['self', 'prefix', 'start', 'end'],
1389
// NOTE(review): the default for `end` is self.length-1, whereas rfind in this
// file defaults it to self.length; if `end` is used as an exclusive bound,
// the last character is left out by default - confirm against the missing lines.
arguments,{start:0, end:self.length-1},null,null)
1390
var prefixes = $ns['prefix']
1391
// a single prefix is handled as a one-item list
if(!isinstance(prefixes,_b_.tuple)){prefixes=[prefixes]}
1397
if (s.indexOf(prefixes[i]) == 0) return true
1398
}
1399
return false
1400
}
1401
1402
// str.strip([chars]): remove the characters of `x` from both ends of the
// string, by applying lstrip() then rstrip(). Without `x`, the whitespace
// class "\\s" is used.
$StringDict.strip = function(self,x){
    var chars = (x==undefined) ? "\\s" : x
    var left_stripped = $StringDict.lstrip(self,chars)
    return $StringDict.rstrip(left_stripped,chars)
}
1406
1407
// str.swapcase(): return a copy of the string with uppercase characters
// converted to lowercase and vice versa.
// Every character is examined (a surrogate pair is handled as one character),
// so letters outside the ASCII range are swapped too.
$StringDict.swapcase = function(self) {
    return self.replace(/[\uD800-\uDBFF][\uDC00-\uDFFF]|[\s\S]/g, function(ch){
        var lower = ch.toLowerCase()
        // a character that changes when lowercased is an uppercase one
        if(ch !== lower){return lower}
        // lowercase characters become uppercase, caseless ones are unchanged
        return ch.toUpperCase()
    })
}
1413
1414
// str.title(): return a titlecased copy of the string.
// As in CPython, a word is a run of cased characters: the first cased
// character that follows an uncased one (or starts the string) is uppercased,
// every other cased character is lowercased. This means that digits,
// apostrophes, hyphens and underscores all start a new word.
$StringDict.title = function(self) {
    var res = '',
        previous_is_cased = false
    for(var i=0; i<self.length; i++){
        var ch = self.charAt(i),
            upper = ch.toUpperCase(),
            lower = ch.toLowerCase(),
            cased = upper !== lower
        if(cased){res += previous_is_cased ? lower : upper}
        else{res += ch}
        previous_is_cased = cased
    }
    return res
}
1418
1419
// str.translate(table)
// NOTE(review): most of this function is not present in this copy of the file
// (the lookup of `repl` in `table`, the loop over the characters of `self` and
// the return statement); only the two lines storing the result are visible.
$StringDict.translate = function(self,table) {
1424
// a replacement of -1 keeps the original character
if(repl==-1){res[pos++]=self.charAt(i)}
1425
// a replacement of None stores nothing, any other value is stored as is
else if(repl!==None){res[pos++]=repl}
1429
}
1430
1431
// str.upper(): return a copy of the string converted to uppercase.
$StringDict.upper = function(self){
    var uppered = self.toUpperCase()
    return uppered
}
1432
1433
// str.zfill(width): return a copy of the string left-filled with '0' digits
// to make a string of length `width`.
//   self  : the string to pad (any content, not only digits)
//   width : the minimum length of the result
// A leading sign ('+' or '-') stays in front and the zeros are inserted after
// it. The string is returned unchanged when `width` is missing or not greater
// than its length.
$StringDict.zfill = function(self, width) {
    if (width === undefined || width <= self.length) {
        return self
    }

    // joining an array of n+1 empty slots with '0' yields n zeros
    var zeros = Array(width - self.length + 1).join('0')
    var first = self.charAt(0)
    if (first === '+' || first === '-') {
        return first + zeros + self.substr(1)
    }
    return zeros + self
}
1440
1441
// Factory for the "str" class: return the string representation of `arg`.
// Called without argument it returns the empty string; Javascript strings are
// returned as is and Javascript numbers are converted with toString().
// NOTE(review): several original lines are not present in this copy of the
// file (the opening of the try block and of the branch handling classes, and
// the fallback inside the catch clause), which is why the braces below do not
// balance and no return value is visible after the warning.
function str(arg){
1442
if(arg===undefined) return ''
1443
switch(typeof arg) {
1444
case 'string': return arg
1445
case 'number': return arg.toString()
1446
}
1452
// class or its subclasses, but the attribute __str__ of the
1453
// class metaclass (usually "type") or its subclasses (usually
1454
// "object")
1455
// The metaclass is the attribute __class__ of the class dictionary
1456
var func = $B.$type.__getattribute__(arg.$dict.__class__,'__str__')
1461
// general case : call the method __str__ of the object
var f = getattr(arg,'__str__')
1462
// XXX fix : if not better than object.__str__, try __repr__
1463
return f()
1464
}
1465
catch(err){
1471
if($B.debug>1){console.log(err)}
1472
console.log('Warning - no method __str__ or __repr__, default to toString', arg)
1474
}
1475
}
1476
}
1477
// Link the factory function and the class dictionary to each other : the
// function `str` is tagged with $B.$factory as its __class__ and reaches the
// dictionary through $dict, while the dictionary reaches the function
// through $factory.
str.__class__ = $B.$factory
1478
str.$dict = $StringDict
1479
$StringDict.$factory = str
1480
// str.__new__(cls): create a bare instance of the class `cls`. The instance
// only holds a reference to the class dictionary (cls.$dict) in its
// __class__ attribute. A TypeError is thrown when `cls` is not provided.
$StringDict.__new__ = function(cls){
    var has_class = (cls!==undefined)
    if(has_class){
        return {__class__:cls.$dict}
    }
    throw _b_.TypeError('str.__new__(): not enough arguments')
}
1486
1489
// dictionary and factory for subclasses of string
// The dictionary starts with the class marker ($B.$type) and the class name;
// other attributes are added to it after this declaration.
var $StringSubclassDict = {
    __class__:$B.$type,
    __name__:'str'
}
1494
1495
// the methods in subclass apply the methods in $StringDict to the
1496
// result of instance.valueOf(), which is a Javascript string
1497
// NOTE(review): the lines that build `args` from the arguments of the wrapper
// are not present in this copy of the file, which is why the braces below do
// not balance.
for(var $attr in $StringDict){
1498
if(typeof $StringDict[$attr]=='function'){
1499
// the immediately-invoked function freezes the current attribute name in
// `attr`, so that each wrapper calls its own method of $StringDict
$StringSubclassDict[$attr]=(function(attr){
1500
return function(){
1506
}
1507
}
1508
return $StringDict[attr].apply(null,args)
1509
}
1510
})($attr)
1511
}
1512
}
1513
// method resolution order of the subclass dictionary : the dictionary itself,
// then $ObjectDict
$StringSubclassDict.__mro__ = [$StringSubclassDict,$ObjectDict]
1514
1515
// factory for str subclasses
// It is tagged as a factory through __class__ and points at the dictionary of
// string subclasses through $dict.
$B.$StringSubclassFactory = {
    __class__:$B.$factory,
    $dict:$StringSubclassDict
}
1520
1521
// expose the factory function under the name "str" on the _b_ object
// (presumably the namespace of Python builtins - confirm)
_b_.str = str
1522
1523
// Function to parse the 2nd argument of format()
1524
// Used as a constructor : the fields found in `spec` (fill, align, sign,
// width, comma, precision, type) are stored as attributes of `this`, and a
// ValueError is thrown if characters remain after the last recognised field.
// NOTE(review): several original lines are not present in this copy of the
// file (the opening statements, which presumably define `pos`, `aligns`,
// `align_pos`, `digits` and `types`, and the headers of blocks further
// down), which is why the braces below do not balance.
$B.parse_format_spec = function(spec){
1534
if(spec.charAt(1) && aligns.indexOf(spec.charAt(1))!=-1){
1535
// If the second char is also an alignment specifier, the
1536
// first char is the fill value
1537
this.fill = spec.charAt(0)
1538
this.align = spec.charAt(1)
1539
pos = 2
1540
}else{
1541
// The first character defines alignment : fill defaults to ' '
1542
this.align=aligns[align_pos];
1543
this.fill=' ';
1544
pos++
1545
}
1546
}else{
1547
align_pos = aligns.indexOf(spec.charAt(1))
1548
if(spec.charAt(1) && align_pos!=-1){
1549
// The second character defines alignment : fill is the first one
1550
this.align=aligns[align_pos]
1551
this.fill=spec.charAt(0)
1552
pos = 2
1553
}
1554
}
1555
// optional sign : '+', '-' or ' '
var car = spec.charAt(pos)
1556
if(car=='+'||car=='-'||car==' '){
1557
this.sign=car;
1558
pos++;
1559
car=spec.charAt(pos);
1562
if(car=='0'){
1563
// sign-aware : equivalent to fill=0 and align=='='
1564
this.fill='0'
1565
this.align = '='
1566
pos++;car=spec.charAt(pos)
1567
}
1569
// the digits of the width are accumulated as a string ...
if(this.width===undefined){this.width=car}
1570
else{this.width+=car}
1571
pos++;car=spec.charAt(pos)
1573
// ... and converted to a number once they have all been read
if(this.width!==undefined){this.width=parseInt(this.width)}
1574
if(car==','){this.comma=true;pos++;car=spec.charAt(pos)}
1575
if(car=='.'){
1576
// a '.' must be followed by at least one digit
if(digits.indexOf(spec.charAt(pos+1))==-1){
1577
throw _b_.ValueError("Missing precision in format spec")
1578
}
1579
this.precision = spec.charAt(pos+1)
1580
pos+=2;car=spec.charAt(pos)
1581
while(car && digits.indexOf(car)>-1){
1582
this.precision+=car;pos++;car=spec.charAt(pos)
1583
}
1584
this.precision = parseInt(this.precision)
1585
}
1586
if(car && types.indexOf(car)>-1){this.type=car;pos++;car=spec.charAt(pos)}
1587
// anything left after the type character is an error
if(pos!==spec.length){
1588
console.log('error', spec, this, pos, spec.charAt(pos))
1589
throw _b_.ValueError("Invalid format specifier")
1590
}
1591
}
1592
// Rebuild a format specification string from the parsed fields.
// NOTE(review): `alternate` and `sign_aware` are read here but not set in the
// visible part of the function, and a precision of 0 is omitted from the
// result because the test on this.precision is a truthiness test - confirm
// that both are intended.
this.toString = function(){
1593
return (this.fill===undefined ? '' : _b_.str(this.fill))+
1594
(this.align||'')+
1595
(this.sign||'')+
1596
(this.alternate ? '#' : '')+
1597
(this.sign_aware ? '0' : '')+
1598
(this.width || '')+
1599
(this.comma ? ',' : '')+
1600
(this.precision ? '.'+this.precision : '')+
1601
(this.type || '')
1602
}
1603
}
1604
1605
$B.format_width = function(s, fmt){
1606
if(fmt.width && s.length<fmt.width){
1607
var fill=fmt.fill || ' ', align = fmt.align || '<',
1608
missing = fmt.width-s.length
1609
switch(align){
1610
case '<':
1611
return s+fill.repeat(missing)
1612
case '>':
1613
return fill.repeat(missing)+s
1614
case '=':
1615
if('+-'.indexOf(s.charAt(0))>-1){
1616
return s.charAt(0)+fill.repeat(missing)+s.substr(1)
1617
}else{
1618
return fill.repeat(missing)+s
1619
}
1620
case '^':
1621
left = parseInt(missing/2)