Chilkat HOME .NET Core C# Android™ AutoIt C C# C++ Chilkat2-Python CkPython Classic ASP DataFlex Delphi ActiveX Delphi DLL Go Java Lianja Mono C# Node.js Objective-C PHP ActiveX PHP Extension Perl PowerBuilder PowerShell PureBasic Ruby SQL Server Swift 2 Swift 3,4,5... Tcl Unicode C Unicode C++ VB.NET VBScript Visual Basic 6.0 Visual FoxPro Xojo Plugin
(Visual Basic 6.0) HTML Table to CSV
Demonstrates a method for converting an HTML table to a CSV file. Note: This example requires Chilkat v9.5.0.77 or greater.
' This example requires the Chilkat API to have been previously unlocked.
' See Global Unlock Sample for sample code.

' Step 1: download the HTML page that contains the table.
Dim http As New ChilkatHttp
Dim bdHtml As New ChilkatBinData
Dim success As Long
success = http.QuickGetBd("https://example-code.com/data/etf_table.html",bdHtml)
If (success <> 1) Then
    Debug.Print http.LastErrorText
    Exit Sub
End If

' Step 2: convert the HTML to XML.
' Each call is checked so that a failed conversion stops here instead of
' silently continuing with an empty or partial document.
Dim htx As New HtmlToXml
success = htx.SetHtmlBd(bdHtml)
If (success <> 1) Then
    Debug.Print htx.LastErrorText
    Exit Sub
End If

Dim sbXml As New ChilkatStringBuilder
success = htx.ToXmlSb(sbXml)
If (success <> 1) Then
    Debug.Print htx.LastErrorText
    Exit Sub
End If

Dim xml As New ChilkatXml
success = xml.LoadSb(sbXml,1)
If (success <> 1) Then
    Debug.Print xml.LastErrorText
    Exit Sub
End If

' Step 3: remove attributes and sub-trees we don't need.
' (In other words, we're getting rid of clutter...)
Dim numRemoved As Long
numRemoved = xml.PruneTag("thead")
numRemoved = xml.PruneAttribute("style")
numRemoved = xml.PruneAttribute("class")

' Scrub the element and attribute content.
xml.Scrub "ContentTrimEnds,ContentTrimInside,AttrTrimEnds,AttrTrimInside"

' Let's see what we have...
Debug.Print xml.GetXml()

' We have the following XML.
' Copy this XML into the online tool at Generate Parsing Code from XML
' as a starting point for accessing the data.

' <?xml version="1.0" encoding="utf-8"?>
' <root>
'     <html>
'         <head>
'             <meta http-equiv="content-type" content="text/html; charset=UTF-8"/>
'         </head>
'         <body text="#000000" bgcolor="#FFFFFF">
'             <div>
'                 <div>
'                     <table role="grid" data-scrollx="true" data-sortdirection="desc" data-sorton="-1"/>
'                 </div>
'             </div>
'             <div>
'                 <table id="topHoldingsTable" role="grid" data-scrollx="true" data-sortdirection="desc" data-sorton="-1">
'                     <tbody>
'                         <tr role="row">
'                             <td>
'                                 <text>ITUB4</text>
'                             </td>
'                             <td>
'                                 <text>ITAU UNIBANCO HOLDING PREF SA</text>
'                             </td>
'                             <td>
'                                 <text>Financials</text>
'                             </td>
'                             <td>
'                                 <text>Brazil</text>
'                             </td>
'                             <td>
'                                 <text>10.94</text>
'                             </td>
'                             <td>
'                                 <text>998,954,813.73</text>
'                             </td>
'                         </tr>
'                         <tr role="row">
'                             <td>
'                                 <text>BBDC4</text>
'                             </td>
'                             <td>
'                                 <text>BANCO BRADESCO PREF SA</text>
'                             </td>
'                             <td>
'                                 <text>Financials</text>
'                             </td>
'                             <td>
'                                 <text>Brazil</text>
'                             </td>
'                             <td>
'                                 <text>9.01</text>
'                             </td>
'                             <td>
'                                 <text>822,164,622.75</text>
'                             </td>
'                         </tr>
' ...
' ...
' ...
'                     </tbody>
'                 </table>
'             </div>
'         </body>
'     </html>
' </root>
'
' Parsing code as produced by the online tool, shown here with
' For...Next counters in place of Do While loops. It walks every
' body-level <div>, reads the table attributes, then visits each
' row (<tr>) and each cell (<td>) of the table body.
'
Dim i As Long, count_i As Long
Dim j As Long, count_j As Long
Dim k As Long, count_k As Long
Dim table_id As String
Dim table_role As String
Dim table_data_scrollx As String
Dim table_data_sortdirection As String
Dim table_data_sorton As String
Dim tr_role As String
Dim tagPath As String
Dim text As String

count_i = xml.NumChildrenHavingTag("html|body|div")
For i = 0 To count_i - 1
    ' [i] in the paths below resolves to the current value of xml.I.
    xml.I = i

    ' Attributes of a table nested one <div> deeper.
    table_role = xml.ChilkatPath("html|body|div[i]|div|table|(role)")
    table_data_scrollx = xml.ChilkatPath("html|body|div[i]|div|table|(data-scrollx)")
    table_data_sortdirection = xml.ChilkatPath("html|body|div[i]|div|table|(data-sortdirection)")
    table_data_sorton = xml.ChilkatPath("html|body|div[i]|div|table|(data-sorton)")

    ' Attributes of a table that is a direct child of this <div>.
    table_id = xml.ChilkatPath("html|body|div[i]|table|(id)")
    table_role = xml.ChilkatPath("html|body|div[i]|table|(role)")
    table_data_scrollx = xml.ChilkatPath("html|body|div[i]|table|(data-scrollx)")
    table_data_sortdirection = xml.ChilkatPath("html|body|div[i]|table|(data-sortdirection)")
    table_data_sorton = xml.ChilkatPath("html|body|div[i]|table|(data-sorton)")

    count_j = xml.NumChildrenHavingTag("html|body|div[i]|table|tbody|tr")
    For j = 0 To count_j - 1
        ' [j] resolves to xml.J: the current table row.
        xml.J = j
        tr_role = xml.ChilkatPath("html|body|div[i]|table|tbody|tr[j]|(role)")

        count_k = xml.NumChildrenHavingTag("html|body|div[i]|table|tbody|tr[j]|td")
        For k = 0 To count_k - 1
            ' [k] resolves to xml.K: the current cell within the row.
            xml.K = k
            text = xml.GetChildContent("html|body|div[i]|table|tbody|tr[j]|td[k]|text")
        Next k
    Next j
Next i

' Next, adapt the loop structure above to populate a CSV.
' Build the CSV: one CSV row per table row (<tr>), one column per cell (<td>).
' The loop counters (i, j, k and count_i, count_j, count_k) are the ones
' declared for the parsing code earlier in this procedure.
Dim csv As New ChilkatCsv
success = csv.SetColumnName(0,"Ticker")
success = csv.SetColumnName(1,"Name")
success = csv.SetColumnName(2,"Sector")
success = csv.SetColumnName(3,"Country")
success = csv.SetColumnName(4,"Weight")
success = csv.SetColumnName(5,"Notional Value")

' Running output row index. Using the per-table row index (j) directly
' would make rows from a second table overwrite rows from the first,
' because j restarts at 0 for every <div>.
Dim csvRow As Long
csvRow = 0

i = 0
count_i = xml.NumChildrenHavingTag("html|body|div")
Do While i < count_i
    xml.I = i
    j = 0
    count_j = xml.NumChildrenHavingTag("html|body|div[i]|table|tbody|tr")
    Do While j < count_j
        xml.J = j
        k = 0
        count_k = xml.NumChildrenHavingTag("html|body|div[i]|table|tbody|tr[j]|td")
        Do While k < count_k
            xml.K = k
            success = csv.SetCell(csvRow,k,xml.GetChildContent("html|body|div[i]|table|tbody|tr[j]|td[k]|text"))
            k = k + 1
        Loop
        ' Advance once per <tr>, whichever table it came from.
        csvRow = csvRow + 1
        j = j + 1
    Loop
    i = i + 1
Loop

' Write the CSV to disk and report a failure instead of ignoring it.
success = csv.SaveFile("qa_output/brasil_etf.csv")
If (success <> 1) Then
    Debug.Print csv.LastErrorText
    Exit Sub
End If

Dim csvStr As String
csvStr = csv.SaveToString()
Debug.Print csvStr

' Our CSV looks like this:

' Ticker,Name,Sector,Country,Weight,Notional Value
' ITUB4,ITAU UNIBANCO HOLDING PREF SA,Financials,Brazil,10.94,"998,954,813.73"
' BBDC4,BANCO BRADESCO PREF SA,Financials,Brazil,9.01,"822,164,622.75"
' VALE3,CIA VALE DO RIO DOCE SH,Materials,Brazil,8.60,"785,290,260.07"
' PETR4,PETROLEO BRASILEIRO PREF SA,Energy,Brazil,5.68,"518,124,434.10"
' PETR3,PETROBRAS,Energy,Brazil,4.86,"443,254,438.53"
' B3SA3,B3 BRASIL BOLSA BALCAO SA,Financials,Brazil,4.57,"417,636,740.16"
' ABEV3,AMBEV SA,Consumer Staples,Brazil,4.57,"417,216,913.63"
' BBAS3,BANCO DO BRASIL SA,Financials,Brazil,3.25,"296,921,232.15"
' ITSA4,ITAUSA INVESTIMENTOS ITAU PREF SA,Financials,Brazil,2.90,"265,153,684.52"
' LREN3,LOJAS RENNER SA,Consumer Discretionary,Brazil,2.25,"205,832,175.98"
© 2000-2024 Chilkat Software, Inc. All Rights Reserved.