[h4]html[/h4]
[code]$Html = @'
Title
Some header elements
huge text in between aside
huge text in between div
Some other elements
'@
[/code]
[h4]Analyse[/h4]
function ParseHtml($String) {
    <#
    .SYNOPSIS
        Loads an HTML string into a new 'HTMLFile' COM document and returns it.
    .PARAMETER String
        The HTML markup to load.
    .OUTPUTS
        The 'HTMLFile' COM object after the markup has been written and the
        document has been closed.
    #>

    # The markup is handed to the COM object as UTF-16 (little-endian) bytes.
    $bytes = [Text.Encoding]::Unicode.GetBytes($String)
    $doc = New-Object -Com 'HTMLFile'

    # Use 'IHTMLDocument2_Write' when the object exposes a method of that
    # name; otherwise fall back to the plain 'write' method.
    if ($doc.PSObject.Methods.Name -NotContains 'IHTMLDocument2_Write') {
        $doc.write($bytes)
    }
    else {
        $doc.IHTMLDocument2_Write($bytes)
    }

    $doc.Close()
    return $doc
}
# Parse the sample markup stored in $Html into a document object.
$Document = ParseHtml $Html
< /code>
[/code]
Code: Select all
# Emit the OuterHTML of every 'aside' element found in the parsed document.
$Document.getElementsByTagName('aside') | ForEach-Object { $_.OuterHTML }
< /code>
[h4]
Code: Select all
# Emit the OuterHTML of every 'div' element found in the parsed document.
$Document.getElementsByTagName('div') | ForEach-Object { $_.OuterHTML }
huge text in between div
< /code>
[list]
[*] Was ist so besonders an dem Element <aside>, das es von anderen Elementen wie z. B. <div> unterscheidet?
[*] Was ist der richtige Weg, um das gesamte Element bis einschließlich des End-Tags zu erfassen?
[/list]