url |
^http://www\.observer\.com/ |
nextLink |
id("main_content")/div[contains(concat(" ", @class, " "), " article_paging ")]/a[not(position()=normalize-space())][1]|//li[@class="pager-next"]/a |
pageElement |
id("article_container")/*|id("channel-nodes channel-blog-nodes")/*[not(@class="blog-ad" or @class="item-list")]|id("gsearch_blitt gsearch_box")/following-sibling::div[@class="list_item"] |
exampleUrl |
http://www.observer.com/2008/would-you-take-tumblr-man
http://www.observer.com/daily-transom
http://www.observer.com/opinion
http://www.observer.com/site-search?keys=obama&sa.x=0&sa.y=0&sa=Submit
http://www.observer.com/site-search?page=1&keys=obama&sa_x=0&sa_y=0&sa=Submit |