#!/usr/bin/env bash
#
# scraper.sh - print the price and URL of every listing found on an Avito
# search-results page.
#
# Provenance: recovered from the patch "Initial commit" by Anatoly Kopyl
# (Mon, 23 Nov 2020 15:06:01 +0300, commit de5a009dc1fb), which created this
# file as scraper.sh (mode 100755).
#
# Usage:
#   scraper.sh [SEARCH_URL]
#
# Arguments:
#   SEARCH_URL     search-results page to scan (defaults to the iPhone 7
#                  search in Saint Petersburg that the script was written for)
#
# Environment:
#   SCRAPER_DELAY  seconds to wait between listing requests (default: 12)
#
# Output (stdout), per listing:
#   <price>        omitted when no price could be extracted
#   <listing URL>
#
# Diagnostics go to stderr. Exits non-zero when the search page cannot be
# fetched or contains no listings.
#
# Requires only curl and a POSIX awk (no GNU grep / PCRE needed).

set -euo pipefail

readonly UA='User-Agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_3) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/44.0.2403.89 Safari/537.36'
readonly BASE_URL='https://www.avito.ru'
readonly DEFAULT_SEARCH_URL='https://www.avito.ru/sankt-peterburg/telefony/iphone-ASgBAgICAUSeAt4J?bt=1&cd=1&i=1&q=iphone+7&s=104'

# Print a diagnostic message to stderr, prefixed with the script name.
warn() {
  printf '%s: %s\n' "${0##*/}" "$*" >&2
}

# Print a diagnostic message and abort the script.
die() {
  warn "$@"
  exit 1
}

#######################################
# Download a page, following redirects.
# Globals:   UA (read)
# Arguments: $1 - URL to download
# Outputs:   page body on stdout; curl errors on stderr
# Returns:   curl's exit status (non-zero on network or HTTP >= 400 errors)
#######################################
fetch() {
  # --url keeps a value that starts with '-' from being parsed as an option.
  curl -fsSL -H "$UA" --url "$1"
}

#######################################
# Extract listing URLs from search-results HTML.
# A link is taken from each line carrying data-marker="item-title" and from
# the line immediately after it (the same window `grep -A1` would select).
# Globals:   BASE_URL (read)
# Arguments: none (HTML on stdin)
# Outputs:   one absolute URL per line on stdout
#######################################
extract_item_urls() {
  awk -v base="$BASE_URL" '
    /data-marker="item-title"/ { window = 2 }
    window > 0 {
      window--
      if (match($0, /href="[^"]+"/)) {
        # Strip the leading href=" (6 chars) and the closing quote.
        href = substr($0, RSTART + 6, RLENGTH - 7)
        if (href ~ /^https?:\/\//) {
          print href
        } else {
          print base href
        }
      }
    }
  '
}

#######################################
# Extract the price from a listing page.
# Uses the first non-empty content="..." attribute on the first line that
# contains itemprop="price".
# Arguments: none (HTML on stdin)
# Outputs:   the attribute value on stdout, or nothing if none was found
#######################################
extract_price() {
  awk '
    /itemprop="price"/ && match($0, /content="[^"]+"/) {
      # Strip the leading content=" (9 chars) and the closing quote.
      print substr($0, RSTART + 9, RLENGTH - 10)
      exit
    }
  '
}

#######################################
# Scan the search page and report price + URL for each listing.
# Globals:   DEFAULT_SEARCH_URL (read), SCRAPER_DELAY (read, optional)
# Arguments: $1 - search URL (optional)
# Outputs:   price and URL lines on stdout, warnings on stderr
#######################################
main() {
  local search_url=${1:-$DEFAULT_SEARCH_URL}
  local delay=${SCRAPER_DELAY:-12}
  local listing item_urls url page price
  local first=1

  command -v curl >/dev/null || die 'curl is required but was not found'

  listing=$(fetch "$search_url") \
    || die "failed to fetch search page: $search_url"

  item_urls=$(extract_item_urls <<<"$listing")
  [[ -n "$item_urls" ]] \
    || die 'no listings found (page layout changed or request blocked?)'

  while IFS= read -r url; do
    [[ -n "$url" ]] || continue

    # Throttle between listing requests only; no pointless wait at the end.
    if (( first )); then
      first=0
    else
      sleep "$delay"
    fi

    # The page is captured before parsing so that stopping at the first
    # price never closes the pipe on a still-running curl.
    if page=$(fetch "$url"); then
      price=$(extract_price <<<"$page")
      if [[ -n "$price" ]]; then
        printf '%s\n' "$price"
      fi
    else
      warn "failed to fetch listing: $url"
    fi

    printf '%s\n' "$url"
  done <<<"$item_urls"
}

main "$@"