6:[["$","$Le",null,{}],["$","div",null,{"className":"min-h-screen bg-gray-100 p-6","children":[["$","$Lf",null,{}],["$","script",null,{"type":"application/ld+json","dangerouslySetInnerHTML":{"__html":"$10"}}],["$","div",null,{"className":"bg-white shadow-md rounded-lg p-6 mb-6 relative","children":[["$","div",null,{"className":"absolute top-4 right-4 flex flex-wrap space-x-2","children":[["$","span","python",{"className":"bg-blue-600 text-white text-sm px-3 py-1 rounded-full","children":["$","$L11",null,{"href":"/discussion/tag/python/1","children":"python"}]}],["$","span","lxml.html",{"className":"bg-blue-600 text-white text-sm px-3 py-1 rounded-full","children":["$","$L11",null,{"href":"/discussion/tag/lxml.html/1","children":"lxml.html"}]}]]}],["$","div",null,{"className":"flex items-center mb-4","children":[["$","img",null,{"src":"https://www.gravatar.com/avatar/82af83259a9fbe0e9744c0af1503de07?s=256&d=identicon&r=PG&f=y&so-version=2","alt":"user3412816","className":"w-16 h-16 rounded-full border"}],["$","div",null,{"className":"ml-4","children":[["$","a",null,{"href":"https://stackoverflow.com/users/3412816/user3412816","target":"_blank","rel":"noopener noreferrer","className":"text-lg font-semibold text-blue-600 hover:underline","children":"user3412816"}],["$","p",null,{"className":"text-sm text-gray-500","children":["Reputation: ",53]}]]}]]}],["$","h1",null,{"className":"text-2xl font-bold text-gray-800 mb-4","children":"How to parse HTML using the lxml.html library"}],["$","p",null,{"className":"text-gray-700 mt-4","dangerouslySetInnerHTML":{"__html":"

Here is the HTML that appears on my site:

\n\n

<meta content=\"auth\" name=\"param\" />\n<meta content=\"I_WANT_THIS\" name=\"token\" />\n

\n\n

How can I use lxml.html to grab that?

\n"}}],["$","div",null,{"className":"text-gray-600 text-sm mt-4","children":[["$","p",null,{"children":["Upvotes: ",1]}],["$","p",null,{"children":["Views: ",1133]}]]}]]}],["$","div",null,{"className":"container mx-auto","children":[["$","h2",null,{"className":"text-2xl font-semibold text-gray-800 mb-6","children":["Answers (",1,")"]}],[["$","div","22364589",{"className":"bg-white shadow-md rounded-lg p-6 mb-6","children":[["$","div",null,{"className":"flex items-center mb-4","children":[["$","img",null,{"src":"https://i.sstatic.net/2DTBv.jpg?s=256","alt":"alecxe","className":"w-12 h-12 rounded-full border"}],["$","div",null,{"className":"ml-4","children":[["$","a",null,{"href":"https://stackoverflow.com/users/771848/alecxe","target":"_blank","rel":"noopener noreferrer","className":"text-lg font-semibold text-blue-600 hover:underline","children":"alecxe"}],["$","p",null,{"className":"text-sm text-gray-500","children":["Reputation: ",474171]}]]}]]}],["$","p",null,{"className":"text-gray-700 mb-4","dangerouslySetInnerHTML":{"__html":"

Use xpath to find the meta tag by name attribute and get the value of content attribute:

\n\n

from lxml.html import fromstring\n\n\nhtml_data = \"\"\" <meta content=\"auth\" name=\"param\" />\n <meta content=\"I_WANT_THIS\" name=\"token\" />\"\"\"\n\ntree = fromstring(html_data)\nprint tree.xpath('//meta[@name=\"token\"]/@content')\n

\n\n

prints:

\n\n

['I_WANT_THIS']\n

\n"}}],["$","div",null,{"className":"text-gray-600 text-sm","children":["$","p",null,{"children":["Upvotes: ",2]}]}]]}]]]}],["$","div",null,{"className":"bg-white shadow-md rounded-lg p-6 mt-6","children":[["$","h2",null,{"className":"text-2xl font-semibold text-gray-800 mb-4","children":"Related Questions"}],["$","ul",null,{"className":"list-disc list-inside","children":[["$","li","39981846",{"className":"mb-2","children":["$","$L11",null,{"href":"/discussion/solution/39981846","className":"text-blue-600 hover:underline","children":"how can i parse html with lxml"}]}],["$","li","18433506",{"className":"mb-2","children":["$","$L11",null,{"href":"/discussion/solution/18433506","className":"text-blue-600 hover:underline","children":"Parsing HTML with lxml (python)"}]}],["$","li","7778128",{"className":"mb-2","children":["$","$L11",null,{"href":"/discussion/solution/7778128","className":"text-blue-600 hover:underline","children":"Parsing html with lxml on python"}]}],["$","li","8635903",{"className":"mb-2","children":["$","$L11",null,{"href":"/discussion/solution/8635903","className":"text-blue-600 hover:underline","children":"Parsing HTML data with lxml"}]}],["$","li","3569152",{"className":"mb-2","children":["$","$L11",null,{"href":"/discussion/solution/3569152","className":"text-blue-600 hover:underline","children":"Parsing HTML with Lxml"}]}],["$","li","14663659",{"className":"mb-2","children":["$","$L11",null,{"href":"/discussion/solution/14663659","className":"text-blue-600 hover:underline","children":"Parse HTML using LXML in Python"}]}],["$","li","12073781",{"className":"mb-2","children":["$","$L11",null,{"href":"/discussion/solution/12073781","className":"text-blue-600 hover:underline","children":"Parsing HTML documents using lxml in python"}]}],["$","li","11795077",{"className":"mb-2","children":["$","$L11",null,{"href":"/discussion/solution/11795077","className":"text-blue-600 hover:underline","children":"Simple example regarding how to parse data from html output using lxml"}]}],["$","li","5646032",{"className":"mb-2","children":["$","$L11",null,{"href":"/discussion/solution/5646032","className":"text-blue-600 hover:underline","children":"HTML parsing using lxml code"}]}],["$","li","4180887",{"className":"mb-2","children":["$","$L11",null,{"href":"/discussion/solution/4180887","className":"text-blue-600 hover:underline","children":"How can I parse html using lxml , python"}]}]]}]]}]]}],["$","$L12",null,{}],["$","$L13",null,{}],["$","$L14",null,{}],["$","$L15",null,{}],["$","$L16",null,{}]]

How to parse HTML using the lxml.html library

Answers (1)

Related Questions