-
Notifications
You must be signed in to change notification settings - Fork 4
/
rime.inc
31 lines (28 loc) · 1.76 KB
/
rime.inc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
<?php
/**
 * Looks up the rhymes of a word on cercarime.it and appends them to a file
 * as a <rime> XML fragment.
 *
 * The page is downloaded with curl into "scraping.html", converted to XHTML
 * through the html2xhtml.cgi web service into "scraping.xhtml" (both files
 * are written in the current working directory), and the rhymes are then
 * extracted from the XHTML with an XPath query.
 *
 * The appended fragment holds one <rima> element per rhyme found, or a single
 * <warning> element ("Nessuna rima trovata", i.e. "no rhyme found") when the
 * page yields no rhymes or could not be fetched/parsed.
 *
 * @param string $parola      Word to find rhymes for; treated as raw text and
 *                            percent-encoded before being put in the URL.
 * @param string $FileNameXml Path of the file the XML fragment is appended to.
 *
 * @return void
 */
function rime($parola, $FileNameXml){
    // Percent-encode the word and shell-quote the whole URL: the word must
    // never reach the shell verbatim (command injection), and the encoded
    // form is pure ASCII so escapeshellarg() cannot drop accented letters.
    $url = "http://www.cercarime.it/?rima=" . urlencode((string) $parola);
    shell_exec("curl " . escapeshellarg($url) . " > scraping.html");

    // Convert the downloaded HTML to XHTML so that SimpleXML can parse it.
    $string = "curl --data-binary @scraping.html -H \"Content-Type: text/html\" http://www.it.uc3m.es/jaf/cgi-bin/html2xhtml.cgi > scraping.xhtml";
    shell_exec($string);

    // Note: an earlier, disabled workaround rewrote "©" and "é" in
    // scraping.xhtml before parsing because such characters could break the
    // DOM; parse failures are now handled below instead of crashing.
    $xml = simplexml_load_file("scraping.xhtml");

    // simplexml_load_file() returns false when the download/conversion failed
    // or produced unparsable markup, and xpath() may not return an array on
    // error; both cases are reported as "no rhymes found".
    $rime = array();
    if ($xml !== false) {
        $found = $xml->xpath("//*[name()='div']/*[name()='div'][1]/*[name()='ul'][1]/*[name()='li']/*[name()='p']/*[name()='i']/*[name()='a']/text()");
        if (is_array($found)) {
            $rime = $found;
        }
    }

    // Build the whole fragment in memory and append it with a single write.
    $output = "\t<rime>\n";
    if (count($rime) == 0) {
        $output .= "\t\t<warning>\n";
        $output .= "\t\t\t Nessuna rima trovata \n";
        $output .= "\t\t</warning>\n";
    } else {
        foreach ($rime as $value) {
            // Escape &, < and > so the rhyme text cannot break the XML output.
            $text = htmlspecialchars((string) $value, ENT_NOQUOTES | ENT_XML1, 'UTF-8');
            $output .= "\t\t<rima>\n";
            $output .= "\t\t\t" . $text . "\n";
            $output .= "\t\t</rima>\n";
        }
    }
    $output .= "\t</rime>\n";

    file_put_contents($FileNameXml, $output, FILE_APPEND);
}
?>