# Extraction rules for lesnumeriques.com review pages (see test_url at the end).
# Each directive maps a field to an XPath expression.

# Title: a <span class="fn"> that comes after an <h1> in document order.
1 title: //h1/following::span[@class='fn']
# Author: the match should stop at the first <br>, but it is not known how to
# express that here, so the whole PDate2 div is selected instead.
2 # NOTE(review): the author value presumably also contains the date text matched below - confirm against the page.
3 author: //following::div[@class='PDate2']
# Date: the <strong> element inside the same PDate2 div used for the author.
4 date: //following::div[@class='PDate2']/strong
# Body: three candidate containers are listed.
# NOTE(review): presumably these are tried in order until one matches - confirm
# against the site-config documentation of the consuming tool.
6 body: //div[@class='ArTexte']
7 body: //div[@id='prod_txt_b']
8 body: //div[@class='ArPhotoP']
# Sample page for checking the rules above.
9 test_url: http://www.lesnumeriques.com/disque-dur-multimedia/popcorn-hour-300-p12231/test.html