NP URI: www.nobleprog.com.eg/cc/pythonwebscraping Undefined array key 0 /apps/hitra7/npfrontend/nptemplates/default.php:137 Array ( [0] => Array ( [file] => /apps/hitra7/npfrontend/nptemplates/default.php [line] => 137 [function] => {closure:/apps/hitra7/npfrontend/index.php:5} [args] => Array ( [0] => 2 [1] => Undefined array key 0 [2] => /apps/hitra7/npfrontend/nptemplates/default.php [3] => 137 ) ) [1] => Array ( [file] => /apps/hitra7/npfrontend/modules/course/course.php [line] => 141 [args] => Array ( [0] => /apps/hitra7/npfrontend/nptemplates/default.php ) [function] => require_once ) [2] => Array ( [file] => /apps/hitra7/npfrontend/core/routes.php [line] => 16 [function] => course_menu_callback [args] => Array ( [0] => /cc/pythonwebscraping ) ) [3] => Array ( [file] => /apps/hitra7/npfrontend/__index.php [line] => 94 [args] => Array ( [0] => /apps/hitra7/npfrontend/core/routes.php ) [function] => require_once ) [4] => Array ( [file] => /apps/hitra7/npfrontend/index.php [line] => 17 [args] => Array ( [0] => /apps/hitra7/npfrontend/__index.php ) [function] => include_once ) [5] => Array ( [file] => /apps/hitra7/index.php [line] => 65 [args] => Array ( [0] => /apps/hitra7/npfrontend/index.php ) [function] => include_once ) ) NP URI: www.nobleprog.com.eg/cc/pythonwebscraping Undefined array key 1 /apps/hitra7/npfrontend/nptemplates/default.php:137 Array ( [0] => Array ( [file] => /apps/hitra7/npfrontend/nptemplates/default.php [line] => 137 [function] => {closure:/apps/hitra7/npfrontend/index.php:5} [args] => Array ( [0] => 2 [1] => Undefined array key 1 [2] => /apps/hitra7/npfrontend/nptemplates/default.php [3] => 137 ) ) [1] => Array ( [file] => /apps/hitra7/npfrontend/modules/course/course.php [line] => 141 [args] => Array ( [0] => /apps/hitra7/npfrontend/nptemplates/default.php ) [function] => require_once ) [2] => Array ( [file] => /apps/hitra7/npfrontend/core/routes.php [line] => 16 [function] => course_menu_callback [args] => Array ( [0] => 
/cc/pythonwebscraping ) ) [3] => Array ( [file] => /apps/hitra7/npfrontend/__index.php [line] => 94 [args] => Array ( [0] => /apps/hitra7/npfrontend/core/routes.php ) [function] => require_once ) [4] => Array ( [file] => /apps/hitra7/npfrontend/index.php [line] => 17 [args] => Array ( [0] => /apps/hitra7/npfrontend/__index.php ) [function] => include_once ) [5] => Array ( [file] => /apps/hitra7/index.php [line] => 65 [args] => Array ( [0] => /apps/hitra7/npfrontend/index.php ) [function] => include_once ) ) NP URI: www.nobleprog.com.eg/cc/pythonwebscraping Undefined array key 2 /apps/hitra7/npfrontend/nptemplates/default.php:137 Array ( [0] => Array ( [file] => /apps/hitra7/npfrontend/nptemplates/default.php [line] => 137 [function] => {closure:/apps/hitra7/npfrontend/index.php:5} [args] => Array ( [0] => 2 [1] => Undefined array key 2 [2] => /apps/hitra7/npfrontend/nptemplates/default.php [3] => 137 ) ) [1] => Array ( [file] => /apps/hitra7/npfrontend/modules/course/course.php [line] => 141 [args] => Array ( [0] => /apps/hitra7/npfrontend/nptemplates/default.php ) [function] => require_once ) [2] => Array ( [file] => /apps/hitra7/npfrontend/core/routes.php [line] => 16 [function] => course_menu_callback [args] => Array ( [0] => /cc/pythonwebscraping ) ) [3] => Array ( [file] => /apps/hitra7/npfrontend/__index.php [line] => 94 [args] => Array ( [0] => /apps/hitra7/npfrontend/core/routes.php ) [function] => require_once ) [4] => Array ( [file] => /apps/hitra7/npfrontend/index.php [line] => 17 [args] => Array ( [0] => /apps/hitra7/npfrontend/__index.php ) [function] => include_once ) [5] => Array ( [file] => /apps/hitra7/index.php [line] => 65 [args] => Array ( [0] => /apps/hitra7/npfrontend/index.php ) [function] => include_once ) )

Course Outline

Introduction

Setting up the Development Environment

Python Primer: Data Structures, Conditionals, File Handling, etc.

Python Packages for Web Scraping: Scrapy and BeautifulSoup

How a Website Works

How HTML is Structured

Making a Web Request

Scraping an HTML Page

Working with XPath and CSS

Filtering Data Using Regular Expressions

Creating a Web Crawler

Crawling AJAX and JavaScript Pages with Selenium

Web Scraping Best Practices

Troubleshooting

Summary and Conclusion

Requirements

  • Programming experience, preferably in Python. If participants have programming experience in a language other than Python, the training can be extended to include more introductory Python exercises.

Audience

  • Developers
Duration: 7 Hours

Number of participants


Price per participant

Testimonials (1)

Upcoming Courses

Related Categories