JAVA正则表达式中的正斜杠

时间:2013-02-12 16:36:41

标签: java regex escaping slash

概况: 使用String.matches(“string”)时,我在使用“/”时遇到一些问题; 我假设我错过了某种程度的逃避。

matches("bar" + "[\\W\\w]*"); //works.
matches("bar/" + "[\\W\\w]*"); //does not work.
matches("bar\/" + "[\\W\\w]*"); //errors
matches("bar\\/" + "[\\W\\w]*"); //does not work
matches("bar\\\\/" + "[\\W\\w]*"); //does not work

我错过了什么?

确切情况:

private static final String CHECK_TABLE_PRE = "<table class=\"data playerStats\">\n <thead>\n  <tr>\n   <th colspan=\"1\" rowspan=\"1\">&nbsp;</th>\n   <th colspan=\"1\" rowspan=\"1\">G</th>\n   <th colspan=\"1\" rowspan=\"1\">A</th>\n   <th colspan=\"1\" rowspan=\"1\">P</th>\n   <th colspan=\"1\" rowspan=\"1\">+/-</th>\n   <th colspan=\"1\" rowspan=\"1\">PIM</th>\n   <th colspan=\"1\" rowspan=\"1\">PPG</th>\n   <th colspan=\"1\" rowspan=\"1\">SHG</th>\n   <th colspan=\"1\" rowspan=\"1\">S</th>\n   <th colspan=\"1\" rowspan=\"1\">S%</th>\n   <th colspan=\"1\" rowspan=\"1\">Shifts</th>\n   <th colspan=\"1\" rowspan=\"1\">TOI</th>\n   <th colspan=\"1\" rowspan=\"1\">FO%</th>\n  </tr>\n</thead>\n<tbody>\n  <tr>";  //want to use this, but the "/" makes it fail
private static final String CHECK_TABLE_POST = "  </tr>\n </tbody>\n</table>"; //Both gotten by copy/pasting from the console.
System.out.println(table.outerHtml().matches("<table class=\"data playerStats\">\n <thead>\n  <tr>\n   <th colspan=\"1\" rowspan=\"1\">&nbsp;</th>\n   <th colspan=\"1\" rowspan=\"1\">G</th>\n   <th colspan=\"1\" rowspan=\"1\">A</th>\n   <th colspan=\"1\" rowspan=\"1\">+" + "[\\W\\w]*" + CHECK_TABLE_POST));
//This works, but I cannot add a add the "/" without getting it to fail.

//Where table = Jsoup.connect("http://www.nhl.com/ice/player.htm?view=log&id=8470598").get().select("table.data.playerStats").get(0);

好的,这是一个更小的更自包含的例子:

String test = "<table class=\"data playerStats\">\n <thead>\n  <tr>\n   <th colspan=\"1\" rowspan=\"1\">&nbsp;</th>\n   <th colspan=\"1\" rowspan=\"1\">G</th>\n   <th colspan=\"1\" rowspan=\"1\">A</th>\n   <th colspan=\"1\" rowspan=\"1\">P</th>\n   <th colspan=\"1\" rowspan=\"1\">+/-</th>\n   <th colspan=\"1\" rowspan=\"1\">PIM</th>\n   <th colspan=\"1\" rowspan=\"1\">PPG</th>\n   <th colspan=\"1\" rowspan=\"1\">SHG</th>\n   <th colspan=\"1\" rowspan=\"1\">S</th>\n   <th colspan=\"1\" rowspan=\"1\">S%</th>\n   <th colspan=\"1\" rowspan=\"1\">Shifts</th>\n   <th colspan=\"1\" rowspan=\"1\">TOI</th>\n   <th colspan=\"1\" rowspan=\"1\">FO%</th>\n  </tr>\n </thead>\n <tbody>\n  <tr>\n   <td colspan=\"1\" rowspan=\"1\"><a class=\"undMe\" href=\"/ice/recap.htm?id=2012020168\"> Feb 10 '13 </a> BOS @ BUF</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">-1</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>0.0</span></td>\n   <td colspan=\"1\" rowspan=\"1\">22</td>\n   <td colspan=\"1\" rowspan=\"1\">15:23</td>\n   <td colspan=\"1\" rowspan=\"1\"></td>\n  </tr>\n  <tr>\n   <td colspan=\"1\" rowspan=\"1\"><a class=\"undMe\" href=\"/ice/recap.htm?id=2012020161\"> Feb 9 '13 </a> BUF @ NYI</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">2</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">3</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>33.3</span></td>\n   <td colspan=\"1\" rowspan=\"1\">26</td>\n   <td colspan=\"1\" rowspan=\"1\">21:47</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>100.00</span></td>\n  </tr>\n  <tr>\n   <td colspan=\"1\" rowspan=\"1\"><a class=\"undMe\" href=\"/ice/recap.htm?id=2012020141\"> Feb 7 '13 </a> MTL @ BUF</td>\n   <td colspan=\"1\" rowspan=\"1\">2</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">2</td>\n   <td colspan=\"1\" rowspan=\"1\">-1</td>\n   <td colspan=\"1\" rowspan=\"1\">2</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">8</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>25.0</span></td>\n   <td colspan=\"1\" rowspan=\"1\">25</td>\n   <td colspan=\"1\" rowspan=\"1\">23:56</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>100.00</span></td>\n  </tr>\n  <tr>\n   <td colspan=\"1\" rowspan=\"1\"><a class=\"undMe\" href=\"/ice/recap.htm?id=2012020132\"> Feb 5 '13 </a> BUF @ OTT</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">-1</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>0.0</span></td>\n   <td colspan=\"1\" rowspan=\"1\">23</td>\n   <td colspan=\"1\" rowspan=\"1\">20:15</td>\n   <td colspan=\"1\" rowspan=\"1\"></td>\n  </tr>\n  <tr>\n   <td colspan=\"1\" rowspan=\"1\"><a class=\"undMe\" href=\"/ice/recap.htm?id=2012020121\"> Feb 3 '13 </a> FLA @ BUF</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">2</td>\n   <td colspan=\"1\" rowspan=\"1\">3</td>\n   <td colspan=\"1\" rowspan=\"1\">3</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>100.0</span></td>\n   <td colspan=\"1\" rowspan=\"1\">24</td>\n   <td colspan=\"1\" rowspan=\"1\">19:15</td>\n   <td colspan=\"1\" rowspan=\"1\"></td>\n  </tr>\n  <tr>\n   <td colspan=\"1\" rowspan=\"1\"><a class=\"undMe\" href=\"/ice/recap.htm?id=2012020109\"> Feb 2 '13 </a> BUF @ MTL</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">2</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">4</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>25.0</span></td>\n   <td colspan=\"1\" rowspan=\"1\">19</td>\n   <td colspan=\"1\" rowspan=\"1\">17:20</td>\n   <td colspan=\"1\" rowspan=\"1\"></td>\n  </tr>\n  <tr>\n   <td colspan=\"1\" rowspan=\"1\"><a class=\"undMe\" href=\"/ice/recap.htm?id=2012020092\"> Jan 31 '13 </a> BUF @ BOS</td>\n   <td colspan=\"1\" rowspan=\"1\">3</td>\n   <td colspan=\"1\" rowspan=\"1\">2</td>\n   <td colspan=\"1\" rowspan=\"1\">5</td>\n   <td colspan=\"1\" rowspan=\"1\">4</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">4</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>75.0</span></td>\n   <td colspan=\"1\" rowspan=\"1\">21</td>\n   <td colspan=\"1\" rowspan=\"1\">19:21</td>\n   <td colspan=\"1\" rowspan=\"1\"></td>\n  </tr>\n  <tr>\n   <td colspan=\"1\" rowspan=\"1\"><a class=\"undMe\" href=\"/ice/recap.htm?id=2012020079\"> Jan 29 '13 </a> TOR @ BUF</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">-1</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">4</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>0.0</span></td>\n   <td colspan=\"1\" rowspan=\"1\">27</td>\n   <td colspan=\"1\" rowspan=\"1\">23:01</td>\n   <td colspan=\"1\" rowspan=\"1\"></td>\n  </tr>\n  <tr>\n   <td colspan=\"1\" rowspan=\"1\"><a class=\"undMe\" href=\"/ice/recap.htm?id=2012020051\"> Jan 25 '13 </a> CAR @ BUF</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">-1</td>\n   <td colspan=\"1\" rowspan=\"1\">6</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">6</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>16.7</span></td>\n   <td colspan=\"1\" rowspan=\"1\">22</td>\n   <td colspan=\"1\" rowspan=\"1\">17:55</td>\n   <td colspan=\"1\" rowspan=\"1\"></td>\n  </tr>\n  <tr>\n   <td colspan=\"1\" rowspan=\"1\"><a class=\"undMe\" href=\"/ice/recap.htm?id=2012020043\"> Jan 24 '13 </a> BUF @ CAR</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">2</td>\n   <td colspan=\"1\" rowspan=\"1\">2</td>\n   <td colspan=\"1\" rowspan=\"1\">-1</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">2</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>0.0</span></td>\n   <td colspan=\"1\" rowspan=\"1\">21</td>\n   <td colspan=\"1\" rowspan=\"1\">18:45</td>\n   <td colspan=\"1\" rowspan=\"1\"></td>\n  </tr>\n  <tr>\n   <td colspan=\"1\" rowspan=\"1\"><a class=\"undMe\" href=\"/ice/recap.htm?id=2012020023\"> Jan 21 '13 </a> BUF @ TOR</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">2</td>\n   <td colspan=\"1\" rowspan=\"1\">2</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">3</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>0.0</span></td>\n   <td colspan=\"1\" rowspan=\"1\">23</td>\n   <td colspan=\"1\" rowspan=\"1\">18:52</td>\n   <td colspan=\"1\" rowspan=\"1\"></td>\n  </tr>\n  <tr>\n   <td colspan=\"1\" rowspan=\"1\"><a class=\"undMe\" href=\"/ice/recap.htm?id=2012020014\"> Jan 20 '13 </a> PHI @ BUF</td>\n   <td colspan=\"1\" rowspan=\"1\">2</td>\n   <td colspan=\"1\" rowspan=\"1\">3</td>\n   <td colspan=\"1\" rowspan=\"1\">5</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">1</td>\n   <td colspan=\"1\" rowspan=\"1\">0</td>\n   <td colspan=\"1\" rowspan=\"1\">9</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>22.2</span></td>\n   <td colspan=\"1\" rowspan=\"1\">26</td>\n   <td colspan=\"1\" rowspan=\"1\">19:17</td>\n   <td colspan=\"1\" rowspan=\"1\"><span>100.00</span></td>\n  </tr>\n </tbody>\n</table>";
System.out.println(test.matches("<table class=\"data playerStats\">\n <thead>\n  <tr>\n   <th colspan=\"1\" rowspan=\"1\">&nbsp;</th>\n   [\\w\\W]*"));
System.out.println(test.matches("<table class=\"data playerStats\">\n <thead>\n  <tr>\n   <th colspan=\"1\" rowspan=\"1\">&nbsp;</th>\n   <th colspan=\"1\" rowspan=\"1\">G</th>\n   <th colspan=\"1\" rowspan=\"1\">A</th>\n   <th colspan=\"1\" rowspan=\"1\">P</th>\n   <th colspan=\"1\" rowspan=\"1\">+/-[\\w\\W]*"));
System.out.println(test.matches(test));

//Console return "true \n false \n false" (without the spaces).
好的,在这里忍受我。更短的例子:

String test = "foo+/-bar";
System.out.println(test.matches("foo+[\\w\\W]*"));
System.out.println(test.matches("foo+/[\\w\\W]*"));
System.out.println(test.matches("foo+/-bar[\\w\\W]*"));
System.out.println(test.matches(test));
//true false false false
//But if I leave out the +-, so that String test = "foo/bar"; (and change the rest of the example accordingly) the whole example work (returns true).

所以,“+ /”有些奇怪。也许我必须逃避加号。

2 个答案:

答案 0 :(得分:7)

无需在JAVA中转义/

matches() 自动锚点 *包含^$的模式。

".*bar/.*"应该符合您的需求。


* String#matches()调用Pattern#matches(),调用Matcher#matches()which explains that true返回,当且仅当整个区域序列匹配时这个匹配器的模式

答案 1 :(得分:1)

  

所以,“+ /”有些奇怪。也许我必须逃避加号。

是的,你这样做。正则表达式中的+表示前面的一个或多个内容,因此为了匹配文字加号,您需要在正则表达式中使用\+,这意味着Java字符串文字中的\\+ < / p>

test.matches("foo\\+/-bar[\\w\\W]*"