estoy tratando de hacer un programa el cual lea un archivo html, tratar el html y una vez tratado guardarlo en otro html.
ya logro leer el html y tratarlo, solo que al querer guardarlo en el archivo salida.html, me cambia
" por "e;
< por <
en general todos los simbolos que encierran las etiquetas en html.
este es el HTML
Código PHP:
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/html; charset=iso-8859-1" />
<title>Lote E10000</title>
<META name="record1" content="E10000 R5000 00689e7d-da4b-4e6f-82a0-0e24c5174bfe.xml 2007-03-09 5403 JAVIER DE LA MORA MOVJ500731AE9">
<META name="record2" content="E10000 R5001 00e5800e-5bd2-4851-bf48-02220680f871.xml 2007-03-09 5394 JOSE ALFREDO LOPEZ PARRILLA LOPA721013XXX">
<META name="record3" content="E10000 R5002 00ee2815-ba4e-4718-b973-0d8a5a0a5951.xml 2007-03-09 5395 RICARDO OROZCO HUOR8005176BA">
<META name="record4" content="E10000 R5003 01041d18-8d60-4f8b-872b-b1ac927c1636.xml 2007-03-09 5460 JOSE ROMERO ROER790709DP0">
<META name="record5" content="E10000 R5004 018a20f5-13ac-4805-a82f-63509fd3533a.xml 2007-03-09 5768 LAURA RODEO820404CNA">
<style type="text/css">
<!--
.style1 {font-family: Verdana, Arial, Helvetica, sans-serif}
-->
</style>
</head>
<body>
<p> Lote<span class="style1">:</span>E10000 <br>
<font face="Verdana, Arial, Helvetica, sans-serif" size="-1">
</font></p>
<font face="Verdana, Arial, Helvetica, sans-serif" size="-1">
<table width="974" border="1" cellpadding="1" cellspacing="1">
<tr>
<td width="313" height="25" valign="top" bgcolor="#CCCCCC">Archivo XML</td>
<td width="167" valign="top" bgcolor="#CCCCCC">Fecha</td>
<td width="55" valign="top" bgcolor="#CCCCCC">folio</td>
<td width="55" valign="top" bgcolor="#CCCCCC">Id Emisor</td>
<td width="55" valign="top" bgcolor="#CCCCCC">Id Receptor</td>
<td width="255" valign="top" bgcolor="#CCCCCC"><p>receptor nombre </p></td>
<td width="156" valign="top" bgcolor="#CCCCCC">receptor rfc </td>
</tr>
<tr>
<td height="40" valign="top"><a href="00689e7d-da4b-4e6f-82a0-0e24c5174bfe.xml">00689e7d-da4b-4e6f-82a0-0e24c5174bfe.xml</a></td>
<td valign="top">2007-03-09T21:44:00</td>
<td valign="top">5403</td>
<td valign="top">E10000</td>
<td valign="top"> R5000 </td>
<td valign="top">JAVIER DE LA MORA </td>
<td valign="top">MOVJ<font size="-1" face="Verdana, Arial, Helvetica, sans-serif">50</font>0731AE9</td>
</tr>
<tr>
<td height="40" valign="top"><a href="00e5800e-5bd2-4851-bf48-02220680f871.xml">00e5800e-5bd2-4851-bf48-02220680f871.xml</a></td>
<td valign="top">2007-03-09T21:44:00 </td>
<td valign="top">5394</td>
<td valign="top">E10000</td>
<td valign="top"> R5001 </td>
<td valign="top">JOSE ALFREDO LOPEZ PARRILLA</td>
<td valign="top">LOPA72<font size="-1" face="Verdana, Arial, Helvetica, sans-serif">10</font>13XXX</td>
</tr>
<tr>
<td height="40" valign="top"><a href="00ee2815-ba4e-4718-b973-0d8a5a0a5951.xml">00ee2815-ba4e-4718-b973-0d8a5a0a5951.xml</a></td>
<td valign="top"> 2007-03-09T21:44:00 </td>
<td valign="top"> 5395 </td>
<td valign="top">E10000</td>
<td valign="top"> R5002 </td>
<td valign="top"> RICARDO OROZCO </td>
<td valign="top"> HUOR<font size="-1" face="Verdana, Arial, Helvetica, sans-serif">80</font>05176BA </td>
</tr>
<tr>
<td height="40" valign="top"><a href="01041d18-8d60-4f8b-872b-b1ac927c1636.xml">01041d18-8d60-4f8b-872b-b1ac927c1636.xml</a></td>
<td valign="top"> 2007-03-09T21:44:00 </td>
<td valign="top"> 5460 </td>
<td valign="top">E10000</td>
<td valign="top"> R5003 </td>
<td valign="top"> JOSE ROMERO </td>
<td valign="top"> ROER<font size="-1" face="Verdana, Arial, Helvetica, sans-serif">79</font>0709DP0 </td>
</tr>
<tr>
<td height="40" valign="top"><a href="018a20f5-13ac-4805-a82f-63509fd3533a.xml">018a20f5-13ac-4805-a82f-63509fd3533a.xml</a></td>
<td valign="top"> 2007-03-09T21:44:00 </td>
<td valign="top"> 5768 </td>
<td valign="top">E10000</td>
<td valign="top"> R5004 </td>
<td valign="top"> LAURA RODEO </td>
<td valign="top"> ROOL<font size="-1" face="Verdana, Arial, Helvetica, sans-serif">82</font>0404CNA </td>
</tr>
</table>
</font>
</body>
</html>
Código PHP:
<?php
$emisores=array('E10000','E10001','E10002','E10003','E10004','E10005','E10006','E10007','E10008','E10009');
$receptor=array('R5000','R5001','R5002','R5003','R5004');
$arch=file("10000_b.html");
$arch_sal=fopen("salida.html","w");
$cont=0;
foreach ($arch as $line_num => $line) {
$cad="";
$cad =htmlspecialchars($line);
$salida="";
for($i=0;$i<count($receptor);$i++){
if (eregi($receptor[$i],$cad)){
$div_cad=split(" ",$cad);
for($j=0;$j<count($div_cad);$j++){
if ($cont==5)$cont=0;
if ($div_cad[$j]==$receptor[$i]){
$cont++;
$div_rec=split('R',$receptor[$i]);
$div_cad[$j]= "R".($div_rec[1]+$cont)." ";
}
$salida.=$div_cad[$j]." ";
}
fputs($arch_sal,$salida);
break;
}else{
fputs($arch_sal,$cad);
break;
}
}
}
fclose($arch_sal);
?>
gracias