我正在编写一个特定领域语言(DSL),需要把一个字符串转换为全小写。我知道 toLowerCase 可以很容易地完成这个任务,但我需要让用双引号或单引号(" 或 ')括起来的部分保持原有的大小写。示例如下。
输入:ThIs iS a teST "sTriNg Y'alL" aS yOu cAN sEE 'hEllO woRl\' o miNE'
输出:this is a test "sTriNg Y'alL" as you can see 'hEllO woRl\' o miNE'
编辑:在示例中添加了用反斜杠转义的引号。
我刚写了一个简单的解析器,不确定它的效果如何,但它应该可以处理任意数量的反斜杠转义。
/**
 * Split a string into consecutive blocks of unquoted ("regular") text and
 * quoted text, so that each kind can be processed differently.
 *
 * A quoted block starts at an unescaped `"` or `'` and runs up to the next
 * unescaped occurrence of the same quote character; the other quote character
 * has no special meaning inside it. A quote counts as escaped when it is
 * preceded by an odd number of backslashes.
 *
 * @param {string} str - Text to split.
 * @returns {Array<{type: string, str: string}>} Blocks in source order.
 *   `type` is 'regular' or 'quote'; quote blocks include their delimiters.
 *   Concatenating every `str` reproduces the input.
 * @throws {SyntaxError} If a quote is opened but never closed.
 */
function string_to_block(str) {
    var blocks = [];
    var regularStart = 0; // index where the pending run of unquoted text begins
    var pos = 0;
    var ch, closeAt;

    // True when the character at `index` is preceded by an odd number of backslashes.
    function isEscaped(index) {
        var backslashes = 0;
        while (index > 0 && str[index - 1] === '\\') {
            ++backslashes;
            --index;
        }
        return backslashes % 2 === 1;
    }

    // Index of the first unescaped `quote` at or after `from`, or -1 if there is none.
    function findUnescaped(quote, from) {
        var k;
        for (k = from; k < str.length; ++k) {
            if (str[k] === quote && !isEscaped(k)) {
                return k;
            }
        }
        return -1;
    }

    while (pos < str.length) {
        ch = str[pos];
        if ((ch !== '"' && ch !== "'") || isEscaped(pos)) {
            ++pos;
            continue;
        }
        closeAt = findUnescaped(ch, pos + 1);
        if (closeAt === -1) {
            throw new SyntaxError('unclosed ' + ch + 'str... starting at index ' + pos);
        }
        if (pos > regularStart) {
            blocks.push({type: 'regular', str: str.slice(regularStart, pos)});
        }
        blocks.push({type: 'quote', str: str.slice(pos, closeAt + 1)});
        pos = closeAt + 1;
        regularStart = pos;
    }

    // Flush trailing unquoted text. Tracking regularStart (rather than the index
    // of the last closing quote) also covers input that contains no quotes at all.
    if (regularStart < str.length) {
        blocks.push({type: 'regular', str: str.slice(regularStart)});
    }
    return blocks;
}
现在
// Run the parser on the sample input from the question.
var foo = string_to_block("ThIs iS a teST \"sTriNg Y'alL\" aS yOu cAN sEE 'hEllO woRl\\' o miNE'");
/*
Expected contents of foo: regular and quote blocks alternate in source order,
and each quote block keeps its delimiters and its original casing.
[
{"type": "regular", "str": "ThIs iS a teST "},
{"type": "quote" , "str": "\"sTriNg Y'alL\""},
{"type": "regular", "str": " aS yOu cAN sEE "},
{"type": "quote" , "str": "'hEllO woRl\\' o miNE'"}
]
*/
所以我们可以根据需要重新构建你的字符串。
// Rebuild the string from the parsed blocks: regular blocks are lowercased,
// quote blocks are appended exactly as they were parsed.
var i = 0, str = '';
while (i < foo.length) {
    str += foo[i].type === 'regular' ? foo[i].str.toLowerCase() : foo[i].str;
    ++i;
}
str; // this is a test "sTriNg Y'alL" as you can see 'hEllO woRl\' o miNE'
我相信存在基于正则表达式的解决方案,但这里是另一种解决方案:在把字符串转换为小写之前,先把带引号的字符串替换掉,以保留它们原有的大小写。
/**
 * Return a lowercased copy of the string in which every segment enclosed in
 * double or single quotes keeps its original casing.
 *
 * A quoted segment runs from an opening `"` or `'` to the next unescaped
 * occurrence of the same quote character. A backslash escapes the character
 * that follows it, so `\"` and `\'` neither open nor close a segment. Text
 * after a quote that is never closed is lowercased like ordinary text.
 *
 * @returns {string} The converted string.
 */
String.prototype.toLowerCaseQuoted = function() {
    // Alternatives, tried in order at each position:
    //   1. an escape pair outside quotes (consumed so an escaped quote cannot open a segment)
    //   2. a complete quoted segment (the only capture group)
    //   3. a run of ordinary characters
    // Each quoted segment is matched on its own, so text between two segments is
    // still lowercased, and no placeholder text is ever inserted into the string.
    var token = /\\[\s\S]|("(?:\\[\s\S]|[^"\\])*"|'(?:\\[\s\S]|[^'\\])*')|[^"'\\]+/g;
    return this.valueOf().replace(token, function(match, quoted) {
        // `quoted` is undefined unless the quoted-segment alternative matched.
        return quoted === undefined ? match.toLowerCase() : match;
    });
};
例如:
"WILL BE LOWER CASE \"QUOTED\" \'MORE QUOTED\'".toLowerCaseQuoted()
结果:"will be lower case "QUOTED" 'MORE QUOTED'"
/**
 * Return a lowercased copy of the string in which every segment enclosed in
 * double or single quotes keeps its original casing.
 *
 * A segment opened by `"` or `'` ends at the next unescaped occurrence of the
 * same quote character; the other quote character is ordinary text inside it.
 * A backslash escapes the character that follows it, so an escaped quote
 * neither opens nor closes a segment. If a quote is never closed, everything
 * from that quote to the end of the string is left unchanged.
 *
 * @returns {string} The converted string.
 */
String.prototype.toLowerCaseQuoted = function() {
    var oldValue = this.valueOf();
    var newValue = '';
    var openQuote = '';   // quote character of the segment being scanned, '' when outside
    var escaped = false;  // true when the previous character was an unescaped backslash
    var runStart = 0;     // start of the text not yet appended to newValue
    var ch;
    for (var i = 0; i < oldValue.length; i++) {
        ch = oldValue.charAt(i);
        if (escaped) {
            escaped = false;
        } else if (ch === '\\') {
            escaped = true;
        } else if (openQuote === '') {
            if (ch === '"' || ch === "'") {
                // Lowercase the whole unquoted run at once rather than one UTF-16
                // unit at a time, so letters encoded as surrogate pairs convert too.
                newValue += oldValue.slice(runStart, i).toLowerCase();
                runStart = i;
                openQuote = ch;
            }
        } else if (ch === openQuote) {
            // Closing quote: copy the quoted segment, delimiters included, verbatim.
            newValue += oldValue.slice(runStart, i + 1);
            runStart = i + 1;
            openQuote = '';
        }
    }
    ch = oldValue.slice(runStart);
    return newValue + (openQuote === '' ? ch.toLowerCase() : ch);
};