ricmitch_uk
Feb 10th, 2001, 04:40 AM
Thought that title'ld get some people's attention...
I need some help with this HTML stripping code, I'm having trouble removing style sheets, applet things, etc.
Can someone tell me where I'm going wrong with this code:
Private Sub StripIt()
On Error Resume Next
Dim strHTML As String
Dim intPos As Integer
Dim intPos2 As Integer
Dim intPos3 As Integer
Dim strTempText As String
Dim strTempText2 As String
Dim Temp As Integer
strHTML = WebBrowser1.Document.documentelement.InnerHTML
Do
If InStr(1, strHTML, "<") And InStr(1, strHTML, ">") <> 0 Then
intPos = InStr(1, strHTML, "<")
strTempText = Left$(strHTML, intPos - 1)
intPos2 = InStr(intPos, strHTML, ">")
Select Case LCase$(Mid$(strHTML, intPos, 7))
Case "<script", "<style>", "<applet"
intPos3 = InStr((intPos2 + 1), strHTML, ">")
strTempText2 = Right$(strHTML, (Len(strHTML) - intPos3))
GoTo EndSelect
Case Else
strTempText2 = Right$(strHTML, (Len(strHTML) - intPos2))
End Select
EndSelect:
strHTML = strTempText + strTempText2
Else
Exit Do
End If
Loop
txtPage.Text = strHTML
End Sub
Thanks for that.
I need some help with this HTML stripping code, I'm having trouble removing style sheets, applet things, etc.
Can someone tell me where I'm going wrong with this code:
Private Sub StripIt()
On Error Resume Next
Dim strHTML As String
Dim intPos As Integer
Dim intPos2 As Integer
Dim intPos3 As Integer
Dim strTempText As String
Dim strTempText2 As String
Dim Temp As Integer
strHTML = WebBrowser1.Document.documentelement.InnerHTML
Do
If InStr(1, strHTML, "<") And InStr(1, strHTML, ">") <> 0 Then
intPos = InStr(1, strHTML, "<")
strTempText = Left$(strHTML, intPos - 1)
intPos2 = InStr(intPos, strHTML, ">")
Select Case LCase$(Mid$(strHTML, intPos, 7))
Case "<script", "<style>", "<applet"
intPos3 = InStr((intPos2 + 1), strHTML, ">")
strTempText2 = Right$(strHTML, (Len(strHTML) - intPos3))
GoTo EndSelect
Case Else
strTempText2 = Right$(strHTML, (Len(strHTML) - intPos2))
End Select
EndSelect:
strHTML = strTempText + strTempText2
Else
Exit Do
End If
Loop
txtPage.Text = strHTML
End Sub
Thanks for that.