Results 1 to 22 of 22

Thread: [RESOLVED] How do I remove JavaScript from HTML source using Regular Expressions. Almost solved.

Threaded View

  1. #14
    PowerPoster
    Join Date
    May 2006
    Posts
    2,988

    Re: How do I remove JavaScript from HTML source using Regular Expressions. Almost solved.

    And here is a version without regular expressions:

    Added removal of extra characters, special symbols, single letters, digits, and common words. The first letter of each word is also converted to upper case.

    VB Code:
    1. Option Explicit
    2.  
    Private Sub Command1_Click()
        ' Fetches a page through the Inet1 control, runs it through the
        ' Remove* helpers in a fixed order, and puts the result in Text1.
        Dim pageText As String

        pageText = Inet1.OpenURL("http://www.yujunet.com/")
        If Len(pageText) = 0 Then Exit Sub          ' nothing was returned

        ' Tabs and line breaks become spaces before any tag matching.
        pageText = RemoveLines(pageText)

        ' Block-level removals run before the generic "<" ... ">" pass so the
        ' text between <style>/<script>/comment delimiters goes with them.
        pageText = RemoveTags(pageText, "<style", "</style>")
        pageText = RemoveTags(pageText, "<script", "</script>")
        pageText = RemoveTags(pageText, "<!--", "-->")
        pageText = RemoveTags(pageText, "<", ">")

        ' Numeric character references such as &#169;
        pageText = RemoveTags(pageText, "&#", ";")

        ' Named entities and punctuation ("#" separates the entries).
        pageText = RemoveChars(pageText, "&nbsp#&amp;#&quot#&gt;#&lt;#[#]#""#;#:#.#,#'#/#$#%#?#!#|#(#)#=#-#+#&#*#©#®")

        ' Digits, then single letters, then common words.
        pageText = RemoveDigits(pageText, "0 1 2 3 4 5 6 7 8 9")
        pageText = RemoveCommon(pageText, "a b c d e f g h i j k l m n o p q r s t u v w x y z")
        pageText = RemoveCommon(pageText, "at and com is or of to that this then the was what with where who when")

        ' Collapse runs of spaces, then capitalise the first letter of each word.
        pageText = RemoveMultiple(pageText, "  ")
        pageText = StrConv(pageText, vbProperCase)

        Text1 = Trim$(pageText)
    End Sub
    22.  
    Private Function RemoveTags(ByVal myString As String, _
        start As String, finish As String) As String
        ' Replaces every span that begins with `start` and ends with `finish`
        ' by a single space and returns the result.
        '
        '   myString - text to clean (passed by value; the caller's copy is untouched)
        '   start    - opening delimiter, e.g. "<script"
        '   finish   - closing delimiter, e.g. "</script>"
        '
        ' Matching is case-insensitive (vbTextCompare). A start marker is only
        ' paired with a finish marker that occurs before the next start marker;
        ' an unpaired start marker is left in the text. When at least one span
        ' was removed the result is Trim$-ed. If myString, start or finish is
        ' empty the input is returned unchanged.
        '
        ' All positions are Long: InStr returns Long, and a downloaded page can
        ' easily exceed the 32,767 limit of Integer.
        Dim result As String
        Dim copyFrom As Long        ' first character not yet copied to result
        Dim startPos As Long        ' position of the current start marker
        Dim bodyFrom As Long        ' first character after the start marker
        Dim endPos As Long          ' position of the nearest finish marker
        Dim nextStart As Long       ' position of the following start marker
        Dim removedAny As Boolean

        If Len(myString) = 0 Or Len(start) = 0 Or Len(finish) = 0 Then
            RemoveTags = myString
            Exit Function
        End If

        copyFrom = 1
        startPos = InStr(1, myString, start, vbTextCompare)
        Do While startPos > 0
            bodyFrom = startPos + Len(start)

            ' Re-use the finish position found earlier while it is still ahead.
            If endPos < bodyFrom Then
                endPos = InStr(bodyFrom, myString, finish, vbTextCompare)
                If endPos = 0 Then Exit Do          ' no closing marker left
            End If

            nextStart = InStr(bodyFrom, myString, start, vbTextCompare)
            If nextStart = 0 Or endPos + Len(finish) <= nextStart Then
                ' Closed before the next start marker: drop the whole span.
                result = result & Mid$(myString, copyFrom, startPos - copyFrom) & " "
                copyFrom = endPos + Len(finish)
                removedAny = True
            End If
            startPos = nextStart
        Loop

        result = result & Mid$(myString, copyFrom)  ' untouched remainder
        If removedAny Then result = Trim$(result)
        RemoveTags = result
    End Function
    37.  
    Private Function RemoveCommon(ByVal myString As String, _
        myVal As String) As String
        ' Removes whole, space-delimited words from myString.
        '
        '   myString - text to clean (passed by value)
        '   myVal    - space-separated list of words to remove, e.g. "the and of"
        '
        ' Matching is case-insensitive (vbTextCompare). Each word is matched
        ' together with the space on either side and replaced by one space, so
        ' the text is padded with a space at both ends to let the first and
        ' last word match too. The padding is applied once; when anything was
        ' removed the padded text is returned (callers should Trim$ it), and
        ' when nothing matched myString is returned unchanged.
        Dim words() As String, idx As Long
        Dim padded As String, needle As String
        Dim changed As Boolean

        padded = " " & myString & " "
        words = Split(myVal)
        For idx = 0 To UBound(words)
            needle = " " & words(idx) & " "
            ' Replace does not rescan its own output, so "a a a" needs
            ' several passes before every " a " is gone.
            Do While InStr(1, padded, needle, vbTextCompare) > 0
                padded = Replace(padded, needle, " ", , , vbTextCompare)
                changed = True
            Loop
        Next idx

        If changed Then
            RemoveCommon = padded
        Else
            RemoveCommon = myString
        End If
    End Function
    49.  
    Private Function RemoveDigits(ByVal myString As String, _
        myVal As String) As String
        ' Replaces every occurrence of each listed token with a single space.
        '
        '   myString - text to clean (passed by value)
        '   myVal    - space-separated list of tokens, e.g. "0 1 2 3 4 5 6 7 8 9"
        '
        ' Returns the cleaned text. Matching uses the module's default
        ' comparison, as InStr/Replace are called without a compare argument.
        Dim tokens() As String, idx As Long

        tokens = Split(myVal)
        For idx = 0 To UBound(tokens)
            ' Split yields an empty token for consecutive spaces. InStr reports
            ' an empty search string as "found" while Replace leaves the text
            ' unchanged, so looping on it would never terminate - skip it.
            If Len(tokens(idx)) > 0 Then
                ' One Replace call already covers every occurrence.
                myString = Replace(myString, tokens(idx), " ")
            End If
        Next idx
        RemoveDigits = myString
    End Function
    61.  
    Private Function RemoveChars(ByVal myString As String, _
        myVal As String) As String
        ' Replaces each listed character sequence, and every "#", with a space.
        '
        '   myString - text to clean (passed by value)
        '   myVal    - "#"-separated list of sequences, e.g. "&amp;#;#:"
        '
        ' Matching is case-insensitive (vbTextCompare, the documented constant,
        ' in place of the bare value 3). Because "#" is the list separator it
        ' cannot appear as a list entry, so it is removed in a separate step.
        Dim tokens() As String, idx As Long

        tokens = Split(myVal, "#")
        For idx = 0 To UBound(tokens)
            If Len(tokens(idx)) > 0 Then            ' "##" or a trailing "#"
                myString = Replace(myString, tokens(idx), " ", , , vbTextCompare)
            End If
        Next idx

        RemoveChars = Replace(myString, "#", " ")
    End Function
    72.  
    Private Function RemoveMultiple(ByVal myString As String, _
        myVal As String) As String
        ' Repeatedly replaces myVal with a single space until myString no
        ' longer contains it; called with "  " this collapses runs of spaces.
        '
        '   myString - text to clean (passed by value)
        '   myVal    - sequence to collapse, e.g. two spaces
        '
        ' The search and the replacement use the same comparison mode
        ' (vbTextCompare) so the loop test and the Replace call always agree.
        Const REPLACEMENT As String = " "

        ' If the replacement itself contains myVal (myVal is "" or " "), every
        ' pass would re-create a match and the loop could never finish.
        If InStr(1, REPLACEMENT, myVal, vbTextCompare) > 0 Then
            RemoveMultiple = myString
            Exit Function
        End If

        Do While InStr(1, myString, myVal, vbTextCompare) > 0
            myString = Replace(myString, myVal, REPLACEMENT, , , vbTextCompare)
        Loop
        RemoveMultiple = myString
    End Function
    80.  
    Private Function RemoveLines(ByVal myString As String) As String
        ' Returns myString with every tab, carriage return and line feed
        ' replaced by a single space each.
        Dim ch As Variant

        For Each ch In Array(vbTab, vbCr, vbLf)
            myString = Replace(myString, ch, " ")
        Next ch
        RemoveLines = myString
    End Function
    Last edited by rory; Jun 20th, 2006 at 06:17 PM.

Posting Permissions

  • You may not post new threads
  • You may not post replies
  • You may not post attachments
  • You may not edit your posts
  •  



Click Here to Expand Forum to Full Width