Rev 14815 | Rev 17234 | Go to most recent revision | Show entire file | Ignore whitespace | Details | Blame | Last modification | View Log | RSS feed
Rev 14815 | Rev 17170 | ||
---|---|---|---|
Line 12... | Line 12... | ||
12 | open (IN ,$file) ; |
12 | open (IN ,$file) ; |
13 | my $text = <IN>; |
13 | my $text = <IN>; |
14 | ##multiple <p> |
14 | ##multiple <p> |
15 | $text =~ s:(<p>\s*){2,}:<p>:g; |
15 | $text =~ s:(<p>\s*){2,}:<p>:g; |
16 | ## close br and hr |
16 | ## close br and hr |
17 | $text =~ s:<(b|h)r\s*>:<$1r |
17 | $text =~ s:<(b|h)r\s*>:<$1r>:g; |
18 | ## delete multiple <br> |
18 | ## delete multiple <br> |
19 | $text =~ s:(<br\s*/>\s*){2,}:< |
19 | $text =~ s:(<br\s*/>\s*){2,}:<br>:g; |
20 | $text =~ s:(<p>\s*){1,}(<li>|</?ul>|</?ol>):$2:g; |
20 | $text =~ s:(<p>\s*){1,}(<li>|</?ul>|</?ol>):$2:g; |
21 | ## delete <br> before <li></?ul></?ol> |
21 | ## delete <br> before <li></?ul></?ol> |
22 | $text =~ s:(<br\s*/?>\s*){1,}(<h[1-5].*>|<li|</h[1-5]>|</?ul>|</?ol>):$2:g; |
22 | $text =~ s:(<br\s*/?>\s*){1,}(<h[1-5].*>|<li|</h[1-5]>|</?ul>|</?ol>):$2:g; |
23 | ## delete <li> empty |
23 | ## delete <li> empty |
24 | $text =~ s:(<li>\s*){1,}</(u|o)l>:</$2l>:g; |
24 | $text =~ s:(<li>\s*){1,}</(u|o)l>:</$2l>:g; |
25 | ## transform some hr |
25 | ## transform some hr |
26 | $text =~ s|<hr\s+width="(\d+)%"\s*/?/>|<hr style="width:$1%" |
26 | $text =~ s|<hr\s+width="(\d+)%"\s*/?/?>|<hr style="width:$1%">|g; |
27 | ## delete <br |
27 | ## delete <br> before table ? |
28 | $text =~ s|(<br\s*/>\s*){1,}</table>|</table>|g; |
28 | $text =~ s|(<br\s*/?>\s*){1,}</table>|</table>|g; |
29 | $text =~ s:</div>\s+</div>:</div></div>:g; |
29 | $text =~ s:</div>\s+</div>:</div></div>:g; |
30 | $text =~ s:</div>\s*(<br\s*/>\s*){1,}</div>:</div></div>:g; |
30 | $text =~ s:</div>\s*(<br\s*/?>\s*){1,}</div>:</div></div>:g; |
31 | ## delete <br/> before div |
31 | ## delete <br/> before div |
32 | $text =~ s:(<br\s*/>\s*){1,}<div:<div:g; |
32 | $text =~ s:(<br\s*/?>\s*){1,}<div:<div:g; |
33 | $text =~ s:<br\s*/> *!:< |
33 | $text =~ s:<br\s*/?> *!:<br>\n!:g; |
34 | $text =~ s:\n{3,}:\n\n:g; |
34 | $text =~ s:\n{3,}:\n\n:g; |
35 | close(IN); |
35 | close(IN); |
36 | 36 | ||
37 | open (OUT, ">$fileout"); |
37 | open (OUT, ">$fileout"); |
38 | print OUT $text ; close OUT; |
38 | print OUT $text ; close OUT; |