CINXE.COM

Blueprints : Beautiful Soup

<!DOCTYPE html>
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en" dir="ltr">
<head>
  <base href="https://blueprints.launchpad.net/beautifulsoup/+specs" />
  <meta charset="UTF-8" />
  <title>Blueprints : Beautiful Soup</title>

  <!-- Icons and browser chrome metadata. -->
  <link rel="apple-touch-icon" sizes="180x180" href="/@@/apple-touch-icon.png?v=2022" />
  <link rel="icon" type="image/png" sizes="32x32" href="/@@/favicon-32x32.png?v=2022" />
  <link rel="icon" type="image/png" sizes="16x16" href="/@@/favicon-16x16.png?v=2022" />
  <link rel="manifest" href="/@@/site.webmanifest?v=2022" />
  <link rel="mask-icon" href="/@@/safari-pinned-tab.svg?v=2022" color="#e9531f" />
  <link rel="shortcut icon" href="/@@/favicon.ico?v=2022" />
  <meta name="msapplication-TileColor" content="#da532c" />
  <meta name="msapplication-config" content="/@@/browserconfig.xml?v=2022" />
  <meta name="theme-color" content="#ffffff" />

  <link type="text/css" rel="stylesheet" media="screen, print" href="/+icing/rev78860d903de6d6d7dd5a0ade63efaca45d3467e2/combo.css" />

  <!-- Open Graph metadata. -->
  <meta property="og:title" content="Blueprints : Beautiful Soup" />
  <meta property="og:type" content="website" />
  <meta property="og:image" content="/@@/launchpad-og-image.png" />
  <meta property="og:url" content="https://blueprints.launchpad.net/beautifulsoup/+specs" />
  <meta property="og:site_name" content="Launchpad" />

  <!--
    NOTE: the inline scripts below rely on "//" line comments, so every
    comment must stay on its own line. Collapsing this markup onto a single
    line turns the rest of each script into a comment.
  -->
  <script type="text/javascript">
    // Global page state; LP.cache is filled in by the json-cache-script
    // block at the end of <body>.
    var LP = {
        cache: {},
        links: {}
    };
  </script>
  <script type="text/javascript">var cookie_scope = '; Path=/; Secure; Domain=.launchpad.net';</script>
  <script type="text/javascript" src="/+combo/rev78860d903de6d6d7dd5a0ade63efaca45d3467e2/?yui/yui/yui-min.js&amp;lp/meta.js&amp;yui/loader/loader-min.js"></script>
  <script type="text/javascript">
    // Loader configuration shared by every YUI instance on the page.
    var raw = null;
    if (LP.devmode) {
        raw = 'raw';
    }
    YUI.GlobalConfig = {
        combine: true,
        comboBase: '/+combo/rev78860d903de6d6d7dd5a0ade63efaca45d3467e2/?',
        root: 'yui/',
        filter: raw,
        debug: false,
        fetchCSS: false,
        maxURLLength: 2000,
        groups: {
            lp: {
                combine: true,
                base: '/+combo/rev78860d903de6d6d7dd5a0ade63efaca45d3467e2/?lp/',
                comboBase: '/+combo/rev78860d903de6d6d7dd5a0ade63efaca45d3467e2/?',
                root: 'lp/',
                // comes from including lp/meta.js
                modules: LP_MODULES,
                fetchCSS: false
            }
        }
    }
  </script>
  <script type="text/javascript">
    // we need this to create a single YUI instance all events and code
    // talks across. All instances of YUI().use should be based off of
    // LPJS instead.
    var LPJS = new YUI();
  </script>
  <script id="base-layout-load-scripts" type="text/javascript">
    //<![CDATA[
    LPJS.use('base', 'node', 'console', 'event', 'oop', 'lp',
             'lp.app.foldables','lp.app.sorttable',
             'lp.app.inlinehelp', 'lp.app.links',
             'lp.bugs.bugtask_index', 'lp.bugs.subscribers',
             'lp.app.ellipsis', 'lp.code.branchmergeproposal.diff',
             'lp.views.global', function(Y) {

        // Initialise the page-wide widgets once the DOM is ready.
        Y.on("domready", function () {
            var global_view = new Y.lp.views.Global();
            global_view.render();

            Y.lp.app.sorttable.SortTable.init();
            Y.lp.app.inlinehelp.init_help();
            Y.lp.activate_collapsibles();
            Y.lp.app.foldables.activate();
            Y.lp.app.links.check_valid_lp_links();
        });

        // Navigate to the new URL when the context's web_link changes.
        Y.on('lp:context:web_link:changed', function(e) {
            window.location = e.new_value;
        });
    });
    //]]>
  </script>
  <script id="base-helper-functions" type="text/javascript">
    //<![CDATA[
    // This code is pulled from lp.js that needs to be available on every
    // request. Pulling here to get it outside the scope of the YUI block.

    /**
     * Focus the first element with the given name that exposes focus().
     * Errors raised while focusing are logged through the YUI console
     * rather than propagated.
     */
    function setFocusByName(name) {
        // Focus the first element matching the given name which can be focused.
        var nodes = document.getElementsByName(name);
        var i, node;
        for (i = 0; i < nodes.length; i++) {
            node = nodes[i];
            if (node.focus) {
                try {
                    // Trying to focus a hidden element throws an error in IE8.
                    if (node.offsetHeight !== 0) {
                        node.focus();
                    }
                } catch (e) {
                    LPJS.use('console', function(Y) {
                        Y.log('In setFocusByName(<' +
                            node.tagName + ' type=' + node.type + '>): ' + e);
                    });
                }
                // Only the first focusable candidate is considered.
                break;
            }
        }
    }

    /**
     * Check the widget with id widget_name, unless the triggering key
     * event was Tab (9) or Enter (13).
     */
    function selectWidget(widget_name, event) {
        if (event && (event.keyCode === 9 || event.keyCode === 13)) {
            // Avoid firing if user is tabbing through or simply pressing
            // enter to submit the form.
            return;
        }
        document.getElementById(widget_name).checked = true;
    }
    //]]>
  </script>

  <meta name="robots" content="noindex,nofollow" />
</head>

<body id="document" itemscope="" itemtype="http://schema.org/WebPage" class="tab-specifications main_side public yui3-skin-sam">
  <div class="yui-d0">
    <div id="locationbar" class="login-logout">
      <div id="logincontrol"><a href="https://blueprints.launchpad.net/beautifulsoup/+login">Log in / Register</a></div>
    </div><!--id="locationbar"-->

    <div id="watermark" class="watermark-apps-portlet">
      <div>
        <!-- The image is the link's only content, so its alt text names the link. -->
        <a href="https://launchpad.net/beautifulsoup"><img alt="Beautiful Soup" width="64" height="64" src="/@@/product-logo" /></a>
      </div>
      <div class="wide">
        <h2 id="watermark-heading"><a href="https://launchpad.net/beautifulsoup">Beautiful Soup</a></h2>
      </div>

      <!-- Application Menu -->
      <ul class="facetmenu">
        <li class="overview"><a href="https://launchpad.net/beautifulsoup">Overview</a></li>
        <li class="branches"><a href="https://code.launchpad.net/beautifulsoup">Code</a></li>
        <li class="bugs"><a href="https://bugs.launchpad.net/beautifulsoup">Bugs</a></li>
        <li class="specifications active"><span>Blueprints</span></li>
        <li class="translations"><a href="https://translations.launchpad.net/beautifulsoup">Translations</a></li>
        <li class="answers"><a href="https://answers.launchpad.net/beautifulsoup">Answers</a></li>
      </ul>
    </div>

    <div class="yui-t4">
      <div id="maincontent" class="yui-main">
        <div class="yui-b" dir="ltr">
          <div class="context-publication">
            <h1>Blueprints for Beautiful Soup</h1>
            <div id="registration" class="registering">
            </div>
          </div>

          <div id="request-notifications">
          </div>

          <div>
            <div class="top-portlet">
              <div id="specs-unknown">
                <!-- <strong> is phrasing content, so it goes inside the paragraph. -->
                <p>
                  <strong>
                    Launchpad does not know how Beautiful Soup tracks feature planning or documentation.
                  </strong>
                </p>
              </div>
            </div>
          </div>
        </div><!-- yui-b -->
      </div><!-- yui-main -->

      <div id="side-portlets" class="yui-b side">
      </div><!-- yui-b side -->
    </div><!-- yui-t4 -->

    <div id="footer" class="footer">
      <div class="lp-arcana">
        <div class="lp-branding">
          <a href="https://launchpad.net/"><img src="/@@/launchpad-footer-logo.svg" alt="Launchpad" width="65" height="18" /></a>
          &nbsp;&bull;&nbsp;
          <a href="https://launchpad.net/+tour">Take the tour</a>
          &nbsp;&bull;&nbsp;
          <a href="https://help.launchpad.net/">Read the guide</a>
          &nbsp;
          <form id="globalsearch" method="get" accept-charset="UTF-8" action="https://launchpad.net/+search">
            <!-- No visible label exists in this layout, so the field is named via aria-label. -->
            <input type="search" id="search-text" name="field.text" aria-label="Search Launchpad" />
            <input type="image" src="/@@/search" style="vertical-align:5%" alt="Search Launchpad" />
          </form>
        </div>
      </div>

      <div class="colophon">
        &copy; 2004
        <a href="http://canonical.com/">Canonical&nbsp;Ltd.</a>
        &nbsp;&bull;&nbsp;
        <a href="https://launchpad.net/legal">Terms of use</a>
        &nbsp;&bull;&nbsp;
        <a href="https://www.ubuntu.com/legal/dataprivacy">Data privacy</a>
        &nbsp;&bull;&nbsp;
        <a href="/feedback">Contact Launchpad Support</a>
        &nbsp;&bull;&nbsp;
        <a href="http://blog.launchpad.net/">Blog</a>
        &nbsp;&bull;&nbsp;
        <a href="https://canonical.com/careers">Careers</a>
        &nbsp;&bull;&nbsp;
        <a href="https://ubuntu.social/@launchpadstatus">System status</a>
        <span id="lp-version">
          &nbsp;&bull;&nbsp;
          78860d9
          (<a href="https://dev.launchpad.net/">Get the code!</a>)
        </span>
      </div>
    </div>
  </div><!-- yui-d0-->

  <!--
    Serialized context object assigned to LP.cache. The statement is kept on
    one line on purpose: a raw line break inside any of its string literals
    is a JavaScript syntax error.
  -->
  <script id="json-cache-script">LP.cache = {"related_features": {}, "context": {"self_link": "https://blueprints.launchpad.net/api/devel/beautifulsoup", "web_link": "https://launchpad.net/beautifulsoup", "resource_type_link": "https://blueprints.launchpad.net/api/devel/#project", "translations_usage": "Not Applicable", "official_answers": false, "official_blueprints": false, "official_codehosting": true, "official_bugs": true, "information_type": "Public", "active": true, "all_specifications_collection_link": "https://blueprints.launchpad.net/api/devel/beautifulsoup/all_specifications", "valid_specifications_collection_link": "https://blueprints.launchpad.net/api/devel/beautifulsoup/valid_specifications", "bug_reporting_guidelines": "** Please read this! There's a good chance you can solve your problem without having to file a bug! **\n\nThe most common bug filed against Beautiful Soup is \"Beautiful Soup didn't parse my document\" or \"Beautiful Soup parsed my document incorrectly.\" (See bug 972524, bug 976903, and bug 1014467 for real-life examples.) Most of the time, this is not a problem with Beautiful Soup: it's a sign that you need to install a third-party HTML parsing library. \n\nBeautiful Soup does not include an HTML parser of its own: it uses whatever you have installed. If you don't have anything installed, Beautiful Soup will use Python's built-in HTML parser. Different parsers will parse the same markup differently, so if the built-in parser doesn't understand your markup in a way that's helpful, you may have better luck installing a third-party parser like lxml or html5lib. See http://www.crummy.com/software/BeautifulSoup/bs4/doc/#installing-a-parser for details.\n\n** If you're sure there's a bug **\n\nWhen filing a bug against Beautiful Soup, the best way to get the problem resolved quickly is to provide a self-contained Python script that duplicates the problem. If your problem only happens on a certain web page, upload the HTML as an attachment to the bug. Please don't just mention the URL to the web page. Web pages change all the time, and by the time I look at your bug it may no longer cause the problem.\n\nFinally, please mention whether you have html5lib or lxml installed on your system, what version of Python you're running, and which parser you were using when you encountered the problem. Some bugs in Beautiful Soup only show up when certain parsers are used.\n", "content_templates": null, "bug_reported_acknowledgement": null, "official_bug_tags": [], "recipes_collection_link": "https://blueprints.launchpad.net/api/devel/beautifulsoup/recipes", "webhooks_collection_link": "https://blueprints.launchpad.net/api/devel/beautifulsoup/webhooks", "bug_supervisor_link": "https://blueprints.launchpad.net/api/devel/~leonardr", "active_milestones_collection_link": "https://blueprints.launchpad.net/api/devel/beautifulsoup/active_milestones", "all_milestones_collection_link": "https://blueprints.launchpad.net/api/devel/beautifulsoup/all_milestones", "translationgroup_link": null, "translationpermission": "Open", "qualifies_for_free_hosting": true, "reviewer_whiteboard": "tag:launchpad.net:2008:redacted", "is_permitted": "tag:launchpad.net:2008:redacted", "project_reviewed": "tag:launchpad.net:2008:redacted", "license_approved": "tag:launchpad.net:2008:redacted", "private": false, "display_name": "Beautiful Soup", "icon_link": "https://blueprints.launchpad.net/api/devel/beautifulsoup/icon", "logo_link": "https://blueprints.launchpad.net/api/devel/beautifulsoup/logo", "name": "beautifulsoup", "owner_link": "https://blueprints.launchpad.net/api/devel/~leonardr", "project_group_link": null, "title": "Beautiful Soup", "registrant_link": "https://blueprints.launchpad.net/api/devel/~leonardr", "driver_link": null, "summary": "A program designed for screen-scraping HTML. The discussion group is at: http://groups.google.com/group/beautifulsoup", "description": null, "date_created": "2009-03-13T21:33:54.049945+00:00", "homepage_url": "http://www.crummy.com/software/BeautifulSoup/", "wiki_url": null, "screenshots_url": null, "download_url": null, "programming_language": "Python", "sourceforge_project": null, "freshmeat_project": null, "brand_link": "https://blueprints.launchpad.net/api/devel/beautifulsoup/brand", "branch_sharing_policy": "Public", "bug_sharing_policy": "Public", "specification_sharing_policy": "Public", "licenses": ["Simplified BSD Licence"], "license_info": null, "bug_tracker_link": null, "series_collection_link": "https://blueprints.launchpad.net/api/devel/beautifulsoup/series", "development_focus_link": "https://blueprints.launchpad.net/api/devel/beautifulsoup/4.0", "releases_collection_link": "https://blueprints.launchpad.net/api/devel/beautifulsoup/releases", "translation_focus_link": null, "commercial_subscription_link": null, "commercial_subscription_is_due": false, "remote_product": null, "vcs": "Git", "http_etag": "\"002b338519b5ac3ee39bbc8b49c7420627d76e32-0fc5e5ff42f19ff38e8ad155caad83a4a062c446\""}};</script>
</body>
<!--
  Facet name: specifications
  Page type: main_side
  Has global search: True
  Has application tabs: True
  Has side portlets: True

  At least 13 queries/external actions issued in 0.13 seconds

  Features: {'profiling.enabled': None, 'hard_timeout': '5000', 'js.yui_version': None, 'app.mainsite_only.canonical_url': None, 'app.maintenance_message': None, 'baselayout.careers_link.disabled': None, 'visible_render_time': None}

  r78860d9
-->
</html>

Pages: 1 2 3 4 5 6 7 8 9 10