Deploy vinta/awesome-python to github.com/vinta/awesome-python.git:gh-pages

2024-11-13 11:16:10 -05:00 · 2019-05-25 10:05:43 +00:00 · 2019-05-25 10:05:43 +00:00 · 5644990ecb
commit 5644990ecb
parent 4f9a8dd9e1
3 changed files with 9 additions and 9 deletions
--- a/index.html
+++ b/index.html
@@ -871,8 +871,8 @@
 </li>
      
        <li class="md-nav__item">
-  <a href="#web-crawling-web-scraping" title="Web Crawling &amp; Web Scraping" class="md-nav__link">
-    Web Crawling &amp; Web Scraping
+  <a href="#web-crawling" title="Web Crawling" class="md-nav__link">
+    Web Crawling
  </a>
  
 </li>
@@ -1497,8 +1497,8 @@
 </li>
      
        <li class="md-nav__item">
-  <a href="#web-crawling-web-scraping" title="Web Crawling &amp; Web Scraping" class="md-nav__link">
-    Web Crawling &amp; Web Scraping
+  <a href="#web-crawling" title="Web Crawling" class="md-nav__link">
+    Web Crawling
  </a>
  
 </li>
@@ -1621,7 +1621,7 @@
 <li><a href="#video">Video</a></li>
 <li><a href="#web-asset-management">Web Asset Management</a></li>
 <li><a href="#web-content-extracting">Web Content Extracting</a></li>
-<li><a href="#web-crawling--web-scraping">Web Crawling &amp; Web Scraping</a></li>
+<li><a href="#web-crawling">Web Crawling</a></li>
 <li><a href="#web-frameworks">Web Frameworks</a></li>
 <li><a href="#websocket">WebSocket</a></li>
 <li><a href="#wsgi-servers">WSGI Servers</a></li>
@@ -2755,17 +2755,17 @@ Code Formatters</li>
 <li><a href="https://github.com/deanmalmgren/textract">textract</a> - Extract text from any document, Word, PowerPoint, PDFs, etc.</li>
 <li><a href="https://github.com/gaojiuli/toapi">toapi</a> - Every web site provides APIs.</li>
 </ul>
-<h2 id="web-crawling-web-scraping">Web Crawling &amp; Web Scraping</h2>
-<p><em>Libraries to automate data extraction from websites.</em></p>
+<h2 id="web-crawling">Web Crawling</h2>
+<p><em>Libraries to automate web data extraction.</em></p>
 <ul>
 <li><a href="https://github.com/chineking/cola">cola</a> - A distributed crawling framework.</li>
 <li><a href="https://pythonhosted.org/feedparser/">feedparser</a> - Universal feed parser.</li>
 <li><a href="https://github.com/lorien/grab">grab</a> - Site scraping framework.</li>
 <li><a href="https://github.com/MechanicalSoup/MechanicalSoup">MechanicalSoup</a> - A Python library for automating interaction with websites.</li>
-<li><a href="https://github.com/scrapinghub/portia">portia</a> - Visual scraping for Scrapy.</li>
 <li><a href="https://github.com/binux/pyspider">pyspider</a> - A powerful spider system.</li>
 <li><a href="https://github.com/jmcarp/robobrowser">robobrowser</a> - A simple, Pythonic library for browsing the web without a standalone web browser.</li>
 <li><a href="https://scrapy.org/">scrapy</a> - A fast high-level screen scraping and web crawling framework.</li>
+<li><a href="https://github.com/scrapinghub/portia">portia</a> - Visual scraping for Scrapy.</li>
 </ul>
 <h2 id="web-frameworks">Web Frameworks</h2>
 <p><em>Full stack web frameworks.</em></p>
--- a/search/search_index.json
+++ b/search/search_index.json
--- a/sitemap.xml.gz
+++ b/sitemap.xml.gz