split用法如下:
scala> val s = "qw#ert#yu#u"
s: String = qw#ert#yu#u
scala> s.split("#")
res5: Array[String] = Array(qw, ert, yu, u)
/**
 * Splits this string around matches of the given regular expression.
 *
 * <p>Convenience overload that forwards to {@code split(regex, 0)}.
 *
 * @param regex the delimiting regular expression
 * @return the array of substrings produced by {@code split(regex, 0)}
 */
public String[] split(String regex) {
    return split(regex, 0);
}
public String[] split(String regex, int limit) { /* fastpath if the regex is a (1)one-char String and this character is not one of the RegEx's meta characters ".$|()[{^?*+\\", or (2)two-char String and the first char is the backslash and the second is not the ascii digit or ascii letter. */ char ch = 0; if (((regex.value.length == 1 && ".$|()[{^?*+\\".indexOf(ch = regex.charAt(0)) == -1) || //如果regex只有一位并且不是这几个特殊字符 (regex.length() == 2 && regex.charAt(0) == '\\' && (((ch = regex.charAt(1))-'0')|('9'-ch)) < 0 && ((ch-'a')|('z'-ch)) < 0 && ((ch-'A')|('Z'-ch)) < 0)) && //如果regex是两位,第一位是转义字符且第二位不是数字和字母 (ch < Character.MIN_HIGH_SURROGATE || ch > Character.MAX_LOW_SURROGATE)) //不属于utf-16字符 { int off = 0; int next = 0; boolean limited = limit > 0; ArrayList<String> list = new ArrayList<>(); while ((next = indexOf(ch, off)) != -1) { if (!limited || list.size() < limit - 1) { list.add(substring(off, next)); off = next + 1; } else { // last one //assert (list.size() == limit - 1); list.add(substring(off, value.length)); off = value.length; break; } } // If no match was found, return this if (off == 0) return new String[]{this}; // Add remaining segment if (!limited || list.size() < limit) list.add(substring(off, value.length)); // Construct result int resultSize = list.size(); if (limit == 0) { while (resultSize > 0 && list.get(resultSize - 1).length() == 0) { resultSize--; } } //去掉长度为0的字符即“” String[] result = new String[resultSize]; return list.subList(0, resultSize).toArray(result); } return Pattern.compile(regex).split(this, limit); }用python简单实现一下:
def split(target, regex):
    """Split ``target`` on every occurrence of the literal separator ``regex``.

    Despite its name, ``regex`` is matched as a plain substring, not as a
    regular expression. Empty pieces are kept, including trailing ones, so
    ``split("a#", "#")`` returns ``['a', '']``.

    Args:
        target: The string to split.
        regex: The non-empty literal separator; may be longer than one
            character.

    Returns:
        A list of the pieces of ``target`` found between separators. If the
        separator does not occur, the list contains ``target`` alone.

    Raises:
        ValueError: If ``regex`` is empty.
    """
    if len(regex) == 0:
        # An empty separator matches at every offset and can never advance.
        raise ValueError("empty separator")
    step = len(regex)
    off = 0
    res = []
    while True:
        theNext = target.find(regex, off)
        if theNext == -1:
            break
        res.append(target[off:theNext])
        # Skip the whole separator, not just its first character.
        off = theNext + step
    # Whatever follows the last separator (possibly the empty string).
    res.append(target[off:])
    return res


print(split("qq#ee#rr#t","#"))
> ['qq', 'ee', 'rr', 't']