Skip to content

Instantly share code, notes, and snippets.

Created July 3, 2012 17:18
Show Gist options
  • Save anonymous/3041137 to your computer and use it in GitHub Desktop.
Save anonymous/3041137 to your computer and use it in GitHub Desktop.
<?php
/**
 * Scrapes a locally saved listing page (data.html) and, for every table row in
 * it, follows the row's link to collect additional details from apl.cnb.cz.
 *
 * The result is left in $person:
 *   $person[0]            raw full-pattern matches from preg_match_all()
 *   $person[1][$i][0..3]  the first four lines of row $i with tags stripped
 *                         (line 2 is additionally entity-decoded)
 *   $person[1][$i][4][0]  text following the "Typ subjektu" label
 *   $person[1][$i][4][1]  text following the "Adresa sídla" label
 *   $person[1][$i][4][2]  text following the "Kontaktní adresa" label
 *   $person[1][$i][4][3]  list of array(linked text, "Ve vazbě" heading text),
 *                         one entry per row of every linked relation page
 *
 * Anything that cannot be fetched or matched is stored as an empty string (or
 * an empty list) so that a single malformed page does not abort the whole run.
 */

// Prefix that the links found in the pages are appended to.
$baseUrl = "https://apl.cnb.cz/apljerrsdad/";

/**
 * Reads a local file or URL and returns its contents.
 *
 * @param string $location Path or URL handed to file_get_contents().
 * @return string The contents, or '' when the read failed.
 */
function cnb_fetch($location)
{
    // Deliberately no "@": PHP's own warning stays visible so failures can be
    // diagnosed, but the caller always receives a string to run regexes on.
    $body = file_get_contents($location);

    return $body === false ? '' : $body;
}

/**
 * Returns the first capture group of the first match of $pattern in $subject.
 *
 * @param string $pattern PCRE pattern containing at least one capture group.
 * @param string $subject Text to search.
 * @return string The captured text, or '' when the pattern does not match.
 */
function cnb_first_capture($pattern, $subject)
{
    if (preg_match($pattern, $subject, $match) === 1 && isset($match[1])) {
        return $match[1];
    }

    return '';
}

$content = cnb_fetch("data.html");
preg_match_all("#<tr>\n(.*?)</tr>\n#s", $content, $person);

// The first two matched rows are discarded (presumably table headers - confirm
// against data.html); array_slice() also re-indexes the remainder from 0.
$person[1] = isset($person[1]) ? array_slice($person[1], 2) : array();

foreach ($person[1] as $i => $rowHtml) {
    // The row is split on newlines; only the first four lines are used below.
    $cells = explode("\n", $rowHtml);
    for ($c = 0; $c < 4; $c++) {
        if (!isset($cells[$c])) {
            $cells[$c] = '';
        }
    }

    // The link has to be taken from line 2 before its markup is stripped.
    $detailLink = cnb_first_capture("#href=\"(.*?)\">#", $cells[2]);

    $cells[0] = strip_tags($cells[0]);
    $cells[1] = strip_tags($cells[1]);
    $cells[2] = html_entity_decode(strip_tags($cells[2]));
    $cells[3] = strip_tags($cells[3]);

    // Without a link there is nothing to fetch; requesting the bare base URL
    // would only produce unrelated markup.
    $more_info = $detailLink === ''
        ? ''
        : cnb_fetch($baseUrl . html_entity_decode($detailLink));

    // Every link inside the "Související vazby" cell points to a relation page.
    $relations = array();
    $relationCell = cnb_first_capture("#Související vazby</td>\n(.*?)</td>#s", $more_info);
    preg_match_all("#href=\"(.*?)\">#s", $relationCell, $relationLinks);
    $relationLinks = isset($relationLinks[1]) ? $relationLinks[1] : array();

    foreach ($relationLinks as $relationLink) {
        $vazba = cnb_fetch($baseUrl . html_entity_decode($relationLink));
        $relationKind = cnb_first_capture("#<h5>Ve vazbě: (.*?)</h5>#s", $vazba);

        // As with the listing page, the first two rows are skipped.
        preg_match_all("#<tr>(.*?)</tr>#s", $vazba, $relationRows);
        $relationRows = isset($relationRows[1]) ? array_slice($relationRows[1], 2) : array();

        foreach ($relationRows as $relationRow) {
            $relations[] = array(
                cnb_first_capture("#\">(.*?)</a>#s", $relationRow),
                $relationKind,
            );
        }
    }

    $cells[4] = array(
        strip_tags(cnb_first_capture("#Typ subjektu</td>\n(.*?)</td>#s", $more_info)),
        strip_tags(cnb_first_capture("#Adresa sídla</td>\n(.*?)</td>#s", $more_info)),
        strip_tags(cnb_first_capture("#Kontaktní adresa</td>\n(.*?)</td>#s", $more_info)),
        $relations,
    );

    $person[1][$i] = $cells;
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment