2015-09-20 11:02:03 +00:00
|
|
|
# Root-table key (it appears before any table header).
# NOTE(review): presumably identifies the site these extraction rules target; confirm against the consumer.
name = "tripadvisor"
|
|
|
|
|
|
|
|
# Extraction rule `index.items`: match elements with the selector in `path`
# and read the attribute named by `attr` from each match.
# NOTE(review): presumably yields the links to individual listing pages; confirm against the consumer.
[index.items]
path = "a.property_title"
attr = "href"
|
|
|
|
|
2015-09-20 11:02:03 +00:00
|
|
|
# Extraction rule `index.next`: match the element with the selector in `path`
# and read its `href` attribute.
# NOTE(review): presumably the link to the next index page (pagination); confirm against the consumer.
[index.next]
path = "div.deckTools.btm a.nav.next.rndBtn.rndBtnGreen.taLnk"
attr = "href"
|
|
|
|
|
2015-09-20 11:02:03 +00:00
|
|
|
# Extraction rule `item.name`: selector for the element holding the item's name.
# No `attr` or `regex` is given for this rule.
# NOTE(review): presumably the consumer then uses the element's text as-is; confirm.
[item.name]
path = "h1#HEADING"
|
|
|
|
|
2015-09-20 11:02:03 +00:00
|
|
|
# Extraction rule `item.address`: selects the direct child spans of the
# formatted address, excluding any span with class `extended-address`.
# NOTE(review): how multiple matches are combined is up to the consumer; confirm.
[item.address]
path = "address span.format_address > span:not(.extended-address)"
|
|
|
|
|
2015-09-20 11:02:03 +00:00
|
|
|
# Extraction rule `item.weight`: take the reviews header element and capture
# the run of digits at the start of its text.
# NOTE(review): presumably the review count, used to weight the item; confirm against the consumer.
[item.weight]
path = "h3.reviews_header"
# Literal (single-quoted) string: `\d` is not a valid escape in a TOML basic
# string, so the pattern must not be double-quoted.
regex = '^(\d+)'
|
|
|
|
|
2015-09-20 11:02:03 +00:00
|
|
|
# Parent table of the `item.semantics.*` sub-tables; it holds no keys of its own.
[item.semantics]
|
|
|
|
# Rating extractor `service`. The four feature keys form a one-hot vector
# (only `accomodating` is 1.0 here); `scale` is 5.0.
# NOTE(review): `scale` is presumably the maximum rating used for normalisation; confirm.
# NOTE(review): `accomodating` is misspelled ("accommodating") but is kept
# as-is because the consumer may look the key up by this exact name.
[item.semantics.service]
accomodating = 1.0
affordable = 0.0
atmospheric = 0.0
delicious = 0.0
scale = 5.0
path = "ul.barChart div.ratingRow img:nth-child(2)"
# Literal (single-quoted) string: `\.` is not a valid escape in a TOML basic
# string. The pattern captures a leading decimal number such as "4.5" or "4".
regex = '^([0-9]*\.?[0-9]+)'
# The number is read from the image's `alt` attribute.
attr = "alt"
|
|
|
|
|
2015-09-20 11:02:03 +00:00
|
|
|
# Rating extractor `food`. The four feature keys form a one-hot vector
# (only `delicious` is 1.0 here); `scale` is 5.0.
# NOTE(review): `scale` is presumably the maximum rating used for normalisation; confirm.
# NOTE(review): `accomodating` is misspelled ("accommodating") but is kept
# as-is because the consumer may look the key up by this exact name.
[item.semantics.food]
accomodating = 0.0
affordable = 0.0
atmospheric = 0.0
delicious = 1.0
scale = 5.0
path = "ul.barChart div.ratingRow img:nth-child(1)"
# Literal (single-quoted) string: `\.` is not a valid escape in a TOML basic
# string. The pattern captures a leading decimal number such as "4.5" or "4".
regex = '^([0-9]*\.?[0-9]+)'
# The number is read from the image's `alt` attribute.
attr = "alt"
|
|
|
|
|
2015-09-20 11:02:03 +00:00
|
|
|
# Rating extractor `value`. The four feature keys form a one-hot vector
# (only `affordable` is 1.0 here); `scale` is 5.0.
# NOTE(review): `scale` is presumably the maximum rating used for normalisation; confirm.
# NOTE(review): `accomodating` is misspelled ("accommodating") but is kept
# as-is because the consumer may look the key up by this exact name.
[item.semantics.value]
accomodating = 0.0
affordable = 1.0
atmospheric = 0.0
delicious = 0.0
scale = 5.0
path = "ul.barChart div.ratingRow img:nth-child(3)"
# Literal (single-quoted) string: `\.` is not a valid escape in a TOML basic
# string. The pattern captures a leading decimal number such as "4.5" or "4".
regex = '^([0-9]*\.?[0-9]+)'
# The number is read from the image's `alt` attribute.
attr = "alt"
|
|
|
|
|
2015-09-20 11:02:03 +00:00
|
|
|
# Rating extractor `atmosphere`. The four feature keys form a one-hot vector
# (only `atmospheric` is 1.0 here); `scale` is 5.0.
# NOTE(review): `scale` is presumably the maximum rating used for normalisation; confirm.
# NOTE(review): `accomodating` is misspelled ("accommodating") but is kept
# as-is because the consumer may look the key up by this exact name.
[item.semantics.atmosphere]
accomodating = 0.0
affordable = 0.0
atmospheric = 1.0
delicious = 0.0
scale = 5.0
path = "ul.barChart div.ratingRow img:nth-child(4)"
# Literal (single-quoted) string: `\.` is not a valid escape in a TOML basic
# string. The pattern captures a leading decimal number such as "4.5" or "4".
regex = '^([0-9]*\.?[0-9]+)'
# The number is read from the image's `alt` attribute.
attr = "alt"
|