url |
^https?://(www\.)?47news\.jp/. |
nextLink |
(//div[@class='topContent']|//p[contains(@class,'pageNate')])/text()[string-length(.)>3]/following-sibling::a|//a[img/@alt='次へ']|id('bt_body')/a|id('mainContent')//div[@align='center']/a[img[contains(@src,'next')]]|id('mainContent')//p[@class='pageNate in_the_box10_b']/text()[not(a)][number(translate(self::text(),'|','')) ]/following-sibling::a[1]|id('mainContent')//li[@class='next']/a|id('mainBlueBoxCenter')//div[@class=' clear pageNateBox font14']/a[last()]|id('next')/a |
pageElement |
(//div[@class='topContent']|//p[contains(@class,'pageNate')])/node()[string-length(.)>3 or self::span]/following-sibling::a|//a[img/@alt='次へ']|id('bt_body')/a|id('mainContent')//div[@align='center']/a[img[contains(@src,'next')]]|id('mainContent')//p[@class='pageNate in_the_box10_b']/text()[not(a)][number(translate(self::text(),'|','')) ]/following-sibling::a[1]|id('mainContent')//li[@class='next']/a|id('mainBlueBoxCenter')//div[@class=' clear pageNateBox font14']/a[last()]|id('next')/a |
exampleUrl |
http://www.47news.jp/news/2009/11/post_20091114161204.html
http://www.47news.jp/news/sports_photogallery_sokuho.php?page=1
http://www.47news.jp/sports/baseball/photo/photo_news_headline.php
http://www.47news.jp/sports/baseball/photo/photogallery_headline.php
http://www.47news.jp/photo/sports/
http://www.47news.jp/news/photonews/2013/02/post_20130209104501.php
http://www.47news.jp/sports/baseball/archives_baseball_headline.php
http://www.47news.jp/sports/baseball/archives_baseball_headline.php?page=2
http://www.47news.jp/news/archives_sportssokuho.php
http://www.47news.jp/news/archives_sportssokuho.php?page=2 |