-
Notifications
You must be signed in to change notification settings - Fork 0
/
scraper.php
53 lines (46 loc) · 1.46 KB
/
scraper.php
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
<?php
require 'scraperwiki.php';
require 'scraperwiki/simple_html_dom.php';
// Scrape the dealer listing page referenced by $pageurl and store one
// datastore row (id, type, price, url) per advertised car.
//
// NOTE: pagination is still disabled, exactly as in the original script:
// only page 1 is fetched. To walk every page, wrap the fetch/parse section in
// a do/while loop that increments $page_counter and keeps going while the page
// contains a "div.oldalszamozas a[title=Következő]" ("Next") link.
$page_counter = 1;
$pageurl = "http://www.hasznaltauto.hu/partner/ber-car_autokereskedes-448/page{$page_counter}";

$html_content = scraperWiki::scrape($pageurl);
$html = str_get_html($html_content);
if (!$html) {
    // str_get_html() yields false for empty or oversized input; fail with a
    // clear message instead of a "member function on non-object" fatal error.
    throw new RuntimeException("Could not fetch or parse listing page: {$pageurl}");
}

// The no-break space is written as an explicit UTF-8 byte escape because the
// literal is invisible in source code. The entity forms are accepted as well:
// innertext is expected to be raw markup, so entities may arrive undecoded
// (NOTE(review): confirm against a live page).
$nbsp_forms = array("\xC2\xA0", "&nbsp;");
$dash_forms = array("–", "&ndash;");
$cube_forms = array("³", "&sup3;");

foreach ($html->find("div.talalati_lista") as $talalat) {
    // Reset per listing so a result that lacks a field can never inherit the
    // value scraped from the previous listing.
    $tipus = null;
    $url = null;
    $kod = null;
    $ar = null;
    $info = array();

    // Title link: ad title, detail URL and the record id. If several links
    // match, the last one wins (same as the original loop).
    foreach ($talalat->find("h2 a") as $el) {
        $tipus = $el->innertext;
        $url = $el->href;
        // The id is taken from the last 7 characters of the detail URL
        // (presumably the numeric ad code; verify against the site).
        $kod = substr($url, -7);
    }

    if (!is_string($kod) || $kod === '') {
        // Without an id the row cannot be keyed; saving it would clobber or
        // duplicate another record, so skip this listing.
        continue;
    }

    // Price text with no-break spaces normalised to plain spaces.
    foreach ($talalat->find("div.talalati_lista_vetelar strong") as $ar_node) {
        $ar = str_replace($nbsp_forms, " ", $ar_node->innertext);
    }

    // Info row: en dashes become field separators, then the row is split on
    // commas. The pieces are parsed but not stored yet (see below).
    foreach ($talalat->find("div.talalati_lista_infosor") as $info_node) {
        $info_text = str_replace($dash_forms, ",", $info_node->innertext);
        $info_text = str_replace($nbsp_forms, " ", $info_text);
        $info_text = str_replace($cube_forms, "3", $info_text);
        $info = array_map('trim', explode(",", $info_text));
    }

    scraperwiki::save(
        array('id'),
        array(
            'id' => $kod,
            'type' => $tipus,
            'price' => $ar,
            // Disabled in the original and still not stored; intended mapping:
            // 'year' => $info[0], 'benzin' => $info[1],
            // 'hub' => $info[2], 'power' => $info[3]
            'url' => $url,
        )
    );
}
?>