-
Notifications
You must be signed in to change notification settings - Fork 19
snippets
Debianguru edited this page Oct 6, 2013
·
8 revisions
This page collects XPath/regex snippets for various websites. You can add them to your config.py file.
Please feel free to contribute and add your own snippets!
* www.solar-log.com (SolarLog 1000)
'shortname': 'SolarLog',
'uri': 'http://www.solar-log.com/typo3conf/ext/getfirmware/getfirmware.php?s=3&logid=7&wrid=999&lng=DE',
'contentxpath': '//body/*'
* www.rockbox.org
'shortname': 'rockbox',
'uri': 'http://www.rockbox.org/download/',
'contentxpath': '//h1',
* willuhn.de/products/hibiscus
'shortname': 'jameica',
'uri': 'http://willuhn.de/products/hibiscus/',
'contentxpath': '//*[@id=\'content\']/div[contains(concat(\' \', normalize-space(@class), \' \'), \'news\')]',
'encoding': 'iso-8859-1',
* calibre-ebook.com
'shortname': 'calibre',
'uri': 'http://calibre-ebook.com/download_linux',
'contentxpath': '//*[@id=\'content\']/p',
'contentregex': 'The latest release of calibre is .*',
* Acer S3 Firmware
'shortname': 'LaptopFirmware',
'uri': 'http://www.acer.com/wjws/ws/gdp/files/en/US/-/latest/bios/4088?_jsonp=FilesDataServiceCallBack_12&t=1368263488751',
'contentregex': 'Version\"\:\d*\.\d*',
* openwrt.org
'shortname': 'OpenWrt',
'uri': 'https://openwrt.org/index.php',
'contentxpath': '//*[contains(concat(\' \', normalize-space(@class), \' \'), \' content \')]',
* Kindle Touch Firmware
'shortname': 'kindleFirmware',
'uri': 'http://www.amazon.com/gp/help/customer/display.html/ref=hp_left_sib?ie=UTF8&nodeId=200790650',
'contentxpath': '//*[@id=\'GUID-3038BDB9-2F50-433B-815E-9160D1C8572E__GUID-5D35F37A-8103-4C6E-B1AB-2FDDE21A8BE0\']',
* www.edimax.com repeater
'shortname': 'edimax',
'uri': 'http://www.edimax.com/en/support_detail.php?pd_id=404&pl1_id=1',
'contentxpath': '//*[@id=\'container\']',
* Munich Highlights
'shortname': 'MUC_Highlights',
'uri': 'http://www.muenchen.de/veranstaltungen/events/highlightsdesjahres.html',
'contentxpath': '//div[@id=\'main\']/div[@class=\'block\']',
* Munich satirical shows
'shortname': 'MUC_Kabarett',
'uri': 'http://www.muenchen.de/veranstaltungen/events/kabarett.html',
'contentxpath': '//*[contains(concat(\' \', normalize-space(@class), \' \'), \' elitem \')]',
* Munich theatre
'shortname': 'MUC_Theater',
'uri': 'http://www.muenchen.de/veranstaltungen/events/theater.html',
'contentxpath': '//*[contains(concat(\' \', normalize-space(@class), \' \'), \' elitem \')]',
* www.hetzner.de
'shortname': 'Hetzner',
'uri': 'http://www.hetzner.de/hosting/news/news-home',
'titlexpath': "//*[@id='content-noright']/h4[position()>1]",
'contentxpath': "//*[@id='content-noright']/p[position()>1]"