From 3ab3a602ac93ac5f1b169f692e16c5b2e8361f10 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Mon, 11 Dec 2017 18:50:45 +0100 Subject: [PATCH 001/100] Initial commit --- README.md | 2 ++ 1 file changed, 2 insertions(+) create mode 100644 README.md diff --git a/README.md b/README.md new file mode 100644 index 0000000..e28fc24 --- /dev/null +++ b/README.md @@ -0,0 +1,2 @@ +# safaribooks +Download and read in EPUB your favorites books from Safari Books Online. From e89b88b068ea39aa42ffb13250ad43a47e56c52a Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Mon, 11 Dec 2017 18:51:21 +0100 Subject: [PATCH 002/100] Update README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index e28fc24..c7ad817 100644 --- a/README.md +++ b/README.md @@ -1,2 +1,2 @@ -# safaribooks +# SafariBooks Download and read in EPUB your favorites books from Safari Books Online. From a970ad8ead5926a59771ce56ec6f1b0880fb8e84 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Mon, 11 Dec 2017 19:22:12 +0100 Subject: [PATCH 003/100] Update README.md --- README.md | 33 +++++++++++++++++++++++++++++++++ 1 file changed, 33 insertions(+) diff --git a/README.md b/README.md index c7ad817..710cb60 100644 --- a/README.md +++ b/README.md @@ -1,2 +1,35 @@ # SafariBooks +Download and read in EPUB your favorites books from [Safari Books Online](https://www.safaribooksonline.com). + +## Usage: +```bash +~$ python3 safaribooks.py --cred "account_mail@mail.com:password01" XXXXXXXXXXXXX +``` +The book ID (the X-es) are the digits that you can find in the URL. +Ex: `https://www.safaribooksonline.com/library/view/book-name/XXXXXXXXXXXXX/ch01.html` + +The first time you use the program, you have to specify your SafariBooksOnline account credentials. +Next times you want to download a book, before session expires, you can omit the credential because the program save your session cookies in a file called `cookies.json`. 
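The README above explains that the book ID is the digits segment of the library URL. Programmatically, it can be sliced out of such a URL; a small illustrative helper (hypothetical, not part of `safaribooks.py`):

```python
from urllib.parse import urlsplit

def safari_book_id(url):
    """Return the digits segment from a Safari Books Online library URL.

    Expects URLs shaped like:
    https://www.safaribooksonline.com/library/view/<book-name>/<ID>/...
    """
    parts = [p for p in urlsplit(url).path.split("/") if p]
    # parts -> ["library", "view", "book-name", "XXXXXXXXXXXXX", ...]
    if len(parts) >= 4 and parts[0] == "library" and parts[3].isdigit():
        return parts[3]
    raise ValueError("not a Safari Books Online book URL: %s" % url)

print(safari_book_id(
    "https://www.safaribooksonline.com/library/view/book-name/9781491958698/ch01.html"
))  # → 9781491958698
```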
+Pay attention if you use a shared PC, because everyone that has access to your files can steal your session. +If you don't want to cache the cookies, just use the `--no-cookies` option and provide all the time your `--cred`. + +#### List of program option: +```text +usage: safaribooks.py [--cred ] [--no-cookies] [--preserve-log] [--help] + Download and read in EPUB your favorites books from Safari Books Online. + +positional arguments: + Book digits ID that you want to download. You can find it in the URL (X-es): + `https://www.safaribooksonline.com/library/view/book-name/XXXXXXXXXXXXX/cover.html` + +optional arguments: + --cred Credentials used to perform the login on SafariBooksOnline. + Es. ` --cred "account_mail@mail.com:password01" `. + --no-cookies Prevent your session data to be saved into `cookies.json` file. + --preserve-log Leave the `info.log` file even if there isn't any error. + --help Show this help message. +``` + +## Example: +\# TODO From 9179364a864b01cc1c72810625275be4e2e71c6a Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Tue, 12 Dec 2017 12:18:03 +0100 Subject: [PATCH 004/100] Update README.md --- README.md | 117 +++++++++++++++++++++++++++++++++++++++++++++--------- 1 file changed, 98 insertions(+), 19 deletions(-) diff --git a/README.md b/README.md index 710cb60..8eedf14 100644 --- a/README.md +++ b/README.md @@ -1,35 +1,114 @@ # SafariBooks -Download and read in EPUB your favorites books from [Safari Books Online](https://www.safaribooksonline.com). +Download and generate an EPUB of your favorite books from [Safari Books Online](https://www.safaribooksonline.com) library. +Use this program only for personal and/or educational purpose. +## Requirements & setup: +```shell +$ git clone https://github.com/lorenzodifuccia/safaribooks.git +Cloning into 'safaribooks'... 
+ +$ cd safaribooks/ +$ pip3 install -r requirements.txt +``` + +The program depends of only two Python 3 modules: +```python3 +lxml>=4.1.1 +requests>=2.18.4 +``` + ## Usage: -```bash -~$ python3 safaribooks.py --cred "account_mail@mail.com:password01" XXXXXXXXXXXXX +It's really simple to use, just choose a book from the library and replace in the following command: + * X-es with its ID, + * `email:password` with your own. + +```shell +$ python3 safaribooks.py --cred "account_mail@mail.com:password01" XXXXXXXXXXXXX ``` -The book ID (the X-es) are the digits that you can find in the URL. -Ex: `https://www.safaribooksonline.com/library/view/book-name/XXXXXXXXXXXXX/ch01.html` + +The ID are the digits that you can find in the URL of the book description page: +`https://www.safaribooksonline.com/library/view/book-name/XXXXXXXXXXXXX/` +Like: `https://www.safaribooksonline.com/library/view/test-driven-development-with/9781491958698/` + +The first time you'll use the program, you'll have to specify your Safari Books Online account credentials. +For the next times you'll download a book, before session expires, you can omit the credential, because the program save your session cookies in a file called `cookies.json`. -The first time you use the program, you have to specify your SafariBooksOnline account credentials. -Next times you want to download a book, before session expires, you can omit the credential because the program save your session cookies in a file called `cookies.json`. Pay attention if you use a shared PC, because everyone that has access to your files can steal your session. -If you don't want to cache the cookies, just use the `--no-cookies` option and provide all the time your `--cred`. +If you don't want to cache the cookies, just use the `--no-cookies` option and provide all the time your `--cred`. 
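The cookie caching described above amounts to serialising the session cookies to JSON and restoring them on the next run, skipping the login. A minimal sketch of that round trip with `requests` (illustrative helpers, not the program's own code; the file name `cookies.json` matches the README):

```python
import json
import requests

def save_cookies(session, path="cookies.json"):
    # Persist the session cookies as a plain name -> value mapping.
    with open(path, "w") as f:
        json.dump(requests.utils.dict_from_cookiejar(session.cookies), f)

def load_cookies(session, path="cookies.json"):
    # Restore a previously saved session without logging in again.
    with open(path) as f:
        session.cookies.update(json.load(f))
```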
-#### List of program option: -```text -usage: safaribooks.py [--cred ] [--no-cookies] [--preserve-log] [--help] +### Program options: +```shell +$ python3 safaribooks.py --help +usage: safaribooks.py [--cred ] [--no-cookies] [--no-kindle] + [--preserve-log] [--help] + -Download and read in EPUB your favorites books from Safari Books Online. +Download and generate an EPUB of your favorite books from Safari Books Online. positional arguments: - Book digits ID that you want to download. You can find it in the URL (X-es): - `https://www.safaribooksonline.com/library/view/book-name/XXXXXXXXXXXXX/cover.html` + Book digits ID that you want to download. + You can find it in the URL (X-es): + `https://www.safaribooksonline.com/library/view/book- + name/XXXXXXXXXXXXX/` optional arguments: - --cred Credentials used to perform the login on SafariBooksOnline. + --cred Credentials used to perform the auth login on Safari + Books Online. Es. ` --cred "account_mail@mail.com:password01" `. - --no-cookies Prevent your session data to be saved into `cookies.json` file. - --preserve-log Leave the `info.log` file even if there isn't any error. + --no-cookies Prevent your session data to be saved into + `cookies.json` file. + --no-kindle Remove some CSS rules that block overflow on `table` + and `pre` elements. Use this option if you're not going + to export the EPUB to E-Readers like Amazon Kindle. + --preserve-log Leave the `info.log` file even if there isn't any + error. --help Show this help message. 
``` -## Example: -\# TODO + * ## Example: [Test-Driven Development with Python, 2nd Edition](https://www.safaribooksonline.com/library/view/test-driven-development-with/9781491958698/) + ```shell + $ python3 safaribooks.py --cred "XXXX@gmail.com:XXXXX" 9781491958698 + + ____ ___ _ + / __/__ _/ _/__ _____(_) + _\ \/ _ `/ _/ _ `/ __/ / + /___/\_,_/_/ \_,_/_/ /_/ + / _ )___ ___ / /__ ___ + / _ / _ \/ _ \/ '_/(_-< + /____/\___/\___/_/\_\/___/ + + ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + [-] Logging into Safari Books Online... + [-] Title: Test-Driven Development with Python, 2nd Edition + [-] Authors: Harry J.W. Percival + [-] Identifier: 9781491958698 + [-] ISBN: 9781491958704 + [-] Publishers: O'Reilly Media, Inc. + [-] Rights: Copyright © O'Reilly Media, Inc. + [-] Description: By taking you through the development of a real web application from beginning to end, the second edition of this hands-on guide demonstrates the practical advantages of test-driven development (TDD) with Python. You’ll learn how to write and run tests before building each part of your app, and then develop the minimum amount of code required to pass those tests. The result? Clean code that works.In the process, you’ll learn the basics of Django, Selenium, Git, jQuery, and Mock, along with curre... + [-] URL: https://www.safaribooksonline.com/library/view/test-driven-development-with/9781491958698/ + [*] Found 73 chapters! + [*] Output directory: + /XXXX/XXXX/Test-Driven Development with Python, 2nd Edition + [-] Downloading book contents... + [#########################################----------------------------] 60% + ... + [-] Creating EPUB file... + [*] Done: Test-Driven Development with Python, 2nd Edition.epub + + If you like it, please * this project on GitHub to make it known: + https://github.com/lorenzodifuccia/safaribooks + e don't forget to renew your Safari Books Online subscription: + https://www.safaribooksonline.com/signup/ + + [!] Bye!! 
+ ``` + The result will be (opening the EPUB file with [Calibre](https://calibre-ebook.com/)): + + ![Book Appearance](https://github.com/lorenzodifuccia/cloudflare/raw/master/Images/safaribooks/safaribooks_example01_TDD.png "Book opened with Calibre") + + * ## Example: `--no-kindle` option + ```bash + $ python3 safaribooks.py --no-kindle 9781491958698 + ``` + ![NoKindle Option](https://github.com/lorenzodifuccia/cloudflare/raw/master/Images/safaribooks/safaribooks_example02_NoKindle.png "Version comparison") From 662e0020ee9515ff4dfc3cc27d6e4ed279c7c980 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Tue, 12 Dec 2017 13:23:57 +0100 Subject: [PATCH 005/100] Update README.md --- README.md | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index 8eedf14..c571ee2 100644 --- a/README.md +++ b/README.md @@ -36,6 +36,11 @@ For the next times you'll download a book, before session expires, you can omit Pay attention if you use a shared PC, because everyone that has access to your files can steal your session. If you don't want to cache the cookies, just use the `--no-cookies` option and provide all the time your `--cred`. +The program default options are thought for ensure best compatibilities for who want to export the `EPUB` to E-Readers like Amazon Kindle. +If you want to do it, I suggest you to convert the `EPUB` to `AZW3` file with [Calibre](https://calibre-ebook.com/). +You can also convert the book to `MOBI` and if you'll convert it with Calibre be sure to select the `Ignore margins`: +![Calibre IgnoreMargins](https://github.com/lorenzodifuccia/cloudflare/raw/master/Images/safaribooks/safaribooks_calibre_IgnoreMargins.png "Select Ignore margins") + ### Program options: ```shell $ python3 safaribooks.py --help @@ -103,7 +108,7 @@ optional arguments: [!] Bye!! 
``` - The result will be (opening the EPUB file with [Calibre](https://calibre-ebook.com/)): + The result will be (opening the `EPUB` file with Calibre): ![Book Appearance](https://github.com/lorenzodifuccia/cloudflare/raw/master/Images/safaribooks/safaribooks_example01_TDD.png "Book opened with Calibre") From 614311653e9dad9a7ea0b499da9416442ff6f7fb Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Tue, 12 Dec 2017 13:26:37 +0100 Subject: [PATCH 006/100] Update README.md --- README.md | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/README.md b/README.md index c571ee2..7682824 100644 --- a/README.md +++ b/README.md @@ -38,9 +38,10 @@ If you don't want to cache the cookies, just use the `--no-cookies` option and p The program default options are thought for ensure best compatibilities for who want to export the `EPUB` to E-Readers like Amazon Kindle. If you want to do it, I suggest you to convert the `EPUB` to `AZW3` file with [Calibre](https://calibre-ebook.com/). 
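Calibre also ships a command-line converter, `ebook-convert`, so the EPUB-to-AZW3 step can be scripted. A sketch that only builds the invocation (the file name is a placeholder; actually running it requires Calibre on the `PATH`):

```python
import os
import shutil
import subprocess

def build_convert_cmd(epub_path):
    """Build the Calibre `ebook-convert` invocation for an EPUB -> AZW3 conversion."""
    return ["ebook-convert", epub_path, epub_path.rsplit(".", 1)[0] + ".azw3"]

# `book.epub` is a placeholder name, not produced by this snippet.
cmd = build_convert_cmd("book.epub")
if shutil.which("ebook-convert") and os.path.exists("book.epub"):
    subprocess.run(cmd, check=True)  # only runs when Calibre and the file exist
else:
    print("Would run:", " ".join(cmd))
```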
-You can also convert the book to `MOBI` and if you'll convert it with Calibre be sure to select the `Ignore margins`: +You can also convert the book to `MOBI` and if you'll convert it with Calibre be sure to select `Ignore margins`: + ![Calibre IgnoreMargins](https://github.com/lorenzodifuccia/cloudflare/raw/master/Images/safaribooks/safaribooks_calibre_IgnoreMargins.png "Select Ignore margins") - + ### Program options: ```shell $ python3 safaribooks.py --help From aa56ce4d4d4d3fe7b2192da6c1878728c90b5278 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Tue, 12 Dec 2017 13:27:27 +0100 Subject: [PATCH 007/100] Update README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 7682824..7526050 100644 --- a/README.md +++ b/README.md @@ -38,7 +38,7 @@ If you don't want to cache the cookies, just use the `--no-cookies` option and p The program default options are thought for ensure best compatibilities for who want to export the `EPUB` to E-Readers like Amazon Kindle. If you want to do it, I suggest you to convert the `EPUB` to `AZW3` file with [Calibre](https://calibre-ebook.com/). 
-You can also convert the book to `MOBI` and if you'll convert it with Calibre be sure to select `Ignore margins`: +You can also convert the book to `MOBI` and if you'll do it with Calibre be sure to select `Ignore margins`: ![Calibre IgnoreMargins](https://github.com/lorenzodifuccia/cloudflare/raw/master/Images/safaribooks/safaribooks_calibre_IgnoreMargins.png "Select Ignore margins") From 2e82d2edaa2432c9525b60fbfea1a2d9692f0712 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Tue, 12 Dec 2017 15:14:52 +0100 Subject: [PATCH 008/100] Update README.md --- README.md | 38 +++++++++++++++++++++++++++----------- 1 file changed, 27 insertions(+), 11 deletions(-) diff --git a/README.md b/README.md index 7526050..b8da7f7 100644 --- a/README.md +++ b/README.md @@ -1,8 +1,13 @@ # SafariBooks -Download and generate an EPUB of your favorite books from [Safari Books Online](https://www.safaribooksonline.com) library. -Use this program only for personal and/or educational purpose. +Download and generate an *EPUB* of your favorite books from [*Safari Books Online*](https://www.safaribooksonline.com) library. +Use this program only for *personal* and/or *educational* purpose. -## Requirements & setup: +## Overview: + * [Requirements & Setup]() + * [Usage]() + * [Examples]() + +## Requirements & Setup: ```shell $ git clone https://github.com/lorenzodifuccia/safaribooks.git Cloning into 'safaribooks'... @@ -11,7 +16,7 @@ $ cd safaribooks/ $ pip3 install -r requirements.txt ``` -The program depends of only two Python 3 modules: +The program depends of only two **Python 3** modules: ```python3 lxml>=4.1.1 requests>=2.18.4 @@ -20,13 +25,13 @@ requests>=2.18.4 ## Usage: It's really simple to use, just choose a book from the library and replace in the following command: * X-es with its ID, - * `email:password` with your own. + * `email:password` with your own. 
```shell $ python3 safaribooks.py --cred "account_mail@mail.com:password01" XXXXXXXXXXXXX ``` -The ID are the digits that you can find in the URL of the book description page: +The ID are the digits that you find in the URL of the book description page: `https://www.safaribooksonline.com/library/view/book-name/XXXXXXXXXXXXX/` Like: `https://www.safaribooksonline.com/library/view/test-driven-development-with/9781491958698/` @@ -37,12 +42,14 @@ Pay attention if you use a shared PC, because everyone that has access to your f If you don't want to cache the cookies, just use the `--no-cookies` option and provide all the time your `--cred`. The program default options are thought for ensure best compatibilities for who want to export the `EPUB` to E-Readers like Amazon Kindle. -If you want to do it, I suggest you to convert the `EPUB` to `AZW3` file with [Calibre](https://calibre-ebook.com/). -You can also convert the book to `MOBI` and if you'll do it with Calibre be sure to select `Ignore margins`: +If you want to do it, I suggest you to convert the `EPUB` to `AZW3` with [Calibre](https://calibre-ebook.com/). +You can also convert the book to `MOBI` and if you'll do it with Calibre be sure to select `Ignore margins` in the conversion options: ![Calibre IgnoreMargins](https://github.com/lorenzodifuccia/cloudflare/raw/master/Images/safaribooks/safaribooks_calibre_IgnoreMargins.png "Select Ignore margins") + +In the other hand, if you're not going to export the `EPUB`, you can use the `--no-kindle` option to remove the CSS that blocks overflow on `table` and `pre` elements, see below in the examples. -### Program options: +#### Program options: ```shell $ python3 safaribooks.py --help usage: safaribooks.py [--cred ] [--no-cookies] [--no-kindle] @@ -71,7 +78,8 @@ optional arguments: --help Show this help message. 
``` - * ## Example: [Test-Driven Development with Python, 2nd Edition](https://www.safaribooksonline.com/library/view/test-driven-development-with/9781491958698/) +## Examples: + * ## Download [Test-Driven Development with Python, 2nd Edition](https://www.safaribooksonline.com/library/view/test-driven-development-with/9781491958698/): ```shell $ python3 safaribooks.py --cred "XXXX@gmail.com:XXXXX" 9781491958698 @@ -113,8 +121,16 @@ optional arguments: ![Book Appearance](https://github.com/lorenzodifuccia/cloudflare/raw/master/Images/safaribooks/safaribooks_example01_TDD.png "Book opened with Calibre") - * ## Example: `--no-kindle` option + * ## Use or not the `--no-kindle` option: ```bash $ python3 safaribooks.py --no-kindle 9781491958698 ``` + ![NoKindle Option](https://github.com/lorenzodifuccia/cloudflare/raw/master/Images/safaribooks/safaribooks_example02_NoKindle.png "Version comparison") + +--- + +## Thanks!! +For any kind of problem, please don't hesitate to open an issue here on *GitHub*. + +*Lorenzo Di Fuccia* From f9f6686ffadffd45dfe318a686177569b47da2d4 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Tue, 12 Dec 2017 15:16:12 +0100 Subject: [PATCH 009/100] Update README.md --- README.md | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/README.md b/README.md index b8da7f7..194a2d2 100644 --- a/README.md +++ b/README.md @@ -3,9 +3,9 @@ Download and generate an *EPUB* of your favorite books from [*Safari Books Onlin Use this program only for *personal* and/or *educational* purpose. 
## Overview: - * [Requirements & Setup]() - * [Usage]() - * [Examples]() + * [Requirements & Setup](#requirements--setup) + * [Usage](#usage) + * [Examples](#examples) ## Requirements & Setup: ```shell From d27d8227a4b4686961611d792712666e30ada021 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Tue, 12 Dec 2017 15:19:36 +0100 Subject: [PATCH 010/100] Update README.md --- README.md | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index 194a2d2..8128ecf 100644 --- a/README.md +++ b/README.md @@ -5,7 +5,8 @@ Use this program only for *personal* and/or *educational* purpose. ## Overview: * [Requirements & Setup](#requirements--setup) * [Usage](#usage) - * [Examples](#examples) + * [Example: Download *Test-Driven Development with Python, 2nd Edition*](#download-test-driven-development-with-python-2nd-edition) + * [Example: Use or not the `--no-kindle` option](#use-or-not-the---no-kindle-option) ## Requirements & Setup: ```shell From 5145fa293e0e17f729d9593409982a8068f7e037 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Tue, 12 Dec 2017 16:12:08 +0100 Subject: [PATCH 011/100] Update README.md --- README.md | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index 8128ecf..a2bb2aa 100644 --- a/README.md +++ b/README.md @@ -126,8 +126,9 @@ optional arguments: ```bash $ python3 safaribooks.py --no-kindle 9781491958698 ``` + On the left book created with `--no-kindle` option, on the right without (default): - ![NoKindle Option](https://github.com/lorenzodifuccia/cloudflare/raw/master/Images/safaribooks/safaribooks_example02_NoKindle.png "Version comparison") + ![NoKindle Option](https://github.com/lorenzodifuccia/cloudflare/raw/master/Images/safaribooks/safaribooks_example02_NoKindle.png "Version compare") --- From ac297007a1788990eead8c393892eaa5a6826907 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Tue, 12 Dec 2017 16:15:05 +0100 Subject: [PATCH 012/100] First release --- 
requirements.txt | 2 + safaribooks.py | 831 +++++++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 833 insertions(+) create mode 100644 requirements.txt create mode 100644 safaribooks.py diff --git a/requirements.txt b/requirements.txt new file mode 100644 index 0000000..6964772 --- /dev/null +++ b/requirements.txt @@ -0,0 +1,2 @@ +lxml>=4.1.1 +requests>=2.18.4 diff --git a/safaribooks.py b/safaribooks.py new file mode 100644 index 0000000..11b35e2 --- /dev/null +++ b/safaribooks.py @@ -0,0 +1,831 @@ +import os +import sys +import json +import shutil +import logging +import argparse +import requests +from lxml import html +from html import escape +from random import random +from urllib.parse import urljoin, urlsplit +from multiprocessing import Process, Queue, Value + + +PATH = os.path.dirname(os.path.realpath(__file__)) +COOKIES_FILE = os.path.join(PATH, "cookies.json") + + +class Display: + BASE_FORMAT = logging.Formatter( + fmt="[%(asctime)s] %(message)s", + datefmt="%d/%b/%Y %H:%M:%S" + ) + + SH_DEFAULT = "\033[0m" + SH_YELLOW = "\033[33m" + SH_BG_RED = "\033[41m" + SH_BG_YELLOW = "\033[43m" + + def __init__(self): + self.columns, _ = shutil.get_terminal_size() + + self.logger = logging.getLogger("SafariBooks") + self.logger.setLevel(logging.INFO) + logs_handler = logging.FileHandler(filename=os.path.join(PATH, "info.log")) + logs_handler.setFormatter(self.BASE_FORMAT) + logs_handler.setLevel(logging.INFO) + self.logger.addHandler(logs_handler) + + self.logger.info("** Welcome to SafariBooks! 
**") + + self.book_ad_info = False + self.css_ad_info = Value("i", 0) + self.images_ad_info = Value("i", 0) + self.in_error = False + + self.state_status = Value("i", 0) + sys.excepthook = self.unhandled_exception + + def log(self, message): + self.logger.info(str(message)) + + def out(self, put): + sys.stdout.write("\r" + " " * self.columns + "\r" + put + "\n") + + def info(self, message, state=False): + self.log(message) + output = (self.SH_YELLOW + "[*]" + self.SH_DEFAULT if not state else + self.SH_BG_YELLOW + "[-]" + self.SH_DEFAULT) + " %s" % message + self.out(output) + + def error(self, error): + if not self.in_error: + self.in_error = True + + self.log(error) + output = self.SH_BG_RED + "[#]" + self.SH_DEFAULT + " %s" % error + self.out(output) + + def exit(self, error): + self.error(str(error)) + output = (self.SH_YELLOW + "[+]" + self.SH_DEFAULT + + " Please delete all the `/OEBPS/*.xhtml`" + " files and restart the program.") + self.out(output) + + output = self.SH_BG_RED + "[!]" + self.SH_DEFAULT + " Aborting..." 
+ self.out(output) + sys.exit(128) + + def unhandled_exception(self, _, o, __): + self.exit("Unhandled Exception: %s (type: %s)" % (o, o.__class__.__name__)) + + def intro(self): + output = self.SH_YELLOW + """ + ____ ___ _ + / __/__ _/ _/__ _____(_) + _\ \/ _ `/ _/ _ `/ __/ / + /___/\_,_/_/ \_,_/_/ /_/ + / _ )___ ___ / /__ ___ + / _ / _ \/ _ \/ '_/(_-< + /____/\___/\___/_/\_\/___/ +""" + self.SH_DEFAULT + output += "\n" + "~" * (self.columns // 2) + self.out(output) + + def parse_description(self, desc): + try: + return html.fromstring(desc).text_content() + + except (html.etree.ParseError, html.etree.ParserError) as e: + self.log("Error parsing the description: %s" % e) + return "n/d" + + def book_info(self, info): + description = self.parse_description(info["description"]).replace("\n", " ") + for t in [ + ("Title", info["title"]), ("Authors", ", ".join(aut["name"] for aut in info["authors"])), + ("Identifier", info["identifier"]), ("ISBN", info["isbn"]), + ("Publishers", ", ".join(pub["name"] for pub in info["publishers"])), + ("Rights", info["rights"]), + ("Description", description[:500] + "..." 
if len(description) >= 500 else description),
+            ("URL", info["web_url"])
+        ]:
+            self.info("{0}: {1}".format(t[0], t[1]), True)
+
+    def state(self, origin, done):
+        progress = int(done * 100 / origin)
+        bar = int(progress * (self.columns - 11) / 100)
+        if self.state_status.value < progress:
+            self.state_status.value = progress
+            sys.stdout.write(
+                "\r    " + self.SH_BG_YELLOW + "[" + ("#" * bar).ljust(self.columns - 11, "-") + "]" +
+                self.SH_DEFAULT + ("%4s" % progress) + "%" + ("\n" if progress == 100 else "")
+            )
+
+    def done(self, epub_file):
+        self.info("Done: %s\n\n"
+                  "    If you like it, please * this project on GitHub to make it known:\n"
+                  "    https://github.com/lorenzodifuccia/safaribooks\n"
+                  "    and don't forget to renew your Safari Books Online subscription:\n"
+                  "    https://www.safaribooksonline.com/signup/\n\n" % epub_file +
+                  self.SH_BG_RED + "[!]" + self.SH_DEFAULT + " Bye!!")
+
+    @staticmethod
+    def api_error(response):
+        message = "API: "
+        if "detail" in response and "Not found" in response["detail"]:
+            message += "book not present in Safari Books Online.\n" \
+                       "    The book identifier is the digits that you can find in the URL:\n" \
+                       "    `https://www.safaribooksonline.com/library/view/book-name/XXXXXXXXXXXXX/`"
+
+        else:
+            os.remove(COOKIES_FILE)
+            message += ("Out-of-Session%s.\n" % (" (%s)" % response["detail"] if "detail" in response else "")) + \
+                       Display.SH_YELLOW + "[+]" + Display.SH_DEFAULT + \
+                       " Use the `--cred` option in order to perform the auth login to Safari Books Online."
+ + return message + + +class SafariBooks: + + HEADERS = { + "accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8", + "accept-encoding": "gzip, deflate, br", + "accept-language": "it-IT,it;q=0.9,en-US;q=0.8,en;q=0.7", + "cache-control": "no-cache", + "cookie": "", + "pragma": "no-cache", + "referer": "https://www.safaribooksonline.com/home/", + "upgrade-insecure-requests": "1", + "user-agent": "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) " + "Chrome/62.0.3202.94 Safari/537.36" + } + + BASE_URL = "https://www.safaribooksonline.com" + LOGIN_URL = BASE_URL + "/accounts/login/" + API_TEMPLATE = BASE_URL + "/api/v1/book/{0}/" + + BASE_01_HTML = "\n" \ + "\n" \ + "\n" \ + "{0}\n" \ + "" \ + "\n" \ + "{1}\n" + + CONTAINER_XML = "" \ + "" \ + "" \ + "" \ + "" \ + "" + + # Format: ID, Title, Authors, Description, Subjects, Publisher, Rights, CoverId, MANIFEST, SPINE, CoverUrl + CONTENT_OPF = "\n" \ + "\n" \ + "\n"\ + "{1}\n" \ + "{2}\n" \ + "{3}\n" \ + "{4}" \ + "{5}\n" \ + "{6}\n" \ + "en-US\n" \ + "{0}\n" \ + "\n" \ + "\n" \ + "\n" \ + "\n" \ + "{8}\n" \ + "\n" \ + "\n{9}\n" \ + "\n" \ + "" + + # Format: ID, Depth, Title, Author, NAVMAP + TOC_NCX = "" \ + "" \ + "" \ + "" \ + "" \ + "" \ + "" \ + "" \ + "" \ + "{2}" \ + "{3}" \ + "{4}" \ + "" + + def __init__(self, args): + self.args = args + self.display = Display() + self.display.intro() + + self.cookies = {} + + if not args.cred: + if not os.path.isfile(COOKIES_FILE): + self.display.exit("Login: unable to find cookies file.\n" + " Please use the --cred option to perform the login.") + + self.cookies = json.load(open(COOKIES_FILE)) + + else: + self.display.info("Logging into Safari Books Online...", state=True) + self.do_login(*[c.replace("'", "").replace('"', "") for c in args.cred]) + if not args.no_cookies: + json.dump(self.cookies, open(COOKIES_FILE, "w")) + + self.book_id = args.bookid + self.api_url = self.API_TEMPLATE.format(self.book_id) + 
self.book_info = self.get_book_info() + self.display.book_info(self.book_info) + self.book_chapters = self.get_book_chapters() + self.display.info("Found %s chapters!" % len(self.book_chapters)) + self.chapters_queue = self.book_chapters[:] + + self.book_title = self.book_info["title"] + self.base_url = self.book_info["web_url"] + + self.BOOK_PATH = os.path.join(PATH, self.book_title) + self.create_dirs() + self.display.info("Output directory:\n %s" % self.BOOK_PATH) + + self.chapter_title = "" + self.filename = "" + self.css = [] + self.images = [] + + self.display.info("Downloading book contents...", state=True) + self.BASE_HTML = self.BASE_01_HTML + (self.KINDLE_HTML if not args.no_kindle else "") + self.BASE_02_HTML + self.get() + + self.css_path = "" + self.images_path = "" + self.cover = "" + + self.display.info("Downloading book CSSs...", state=True) + self.collect_css() + self.display.info("Downloading book images...", state=True) + self.collect_images() + + self.display.info("Creating EPUB file...", state=True) + self.create_epub() + + if not args.no_cookies: + json.dump(self.cookies, open(COOKIES_FILE, "w")) + + self.display.done(self.book_title + ".epub") + + if not self.display.in_error and not args.log: + os.remove(os.path.join(PATH, "info.log")) + + sys.exit(0) + + def return_cookies(self): + return " ".join(["{0}={1};".format(k, v) for k, v in self.cookies.items()]) + + def return_headers(self, url): + if "safaribooksonline" in urlsplit(url).netloc: + self.HEADERS["cookie"] = self.return_cookies() + + else: + self.HEADERS["cookie"] = "" + + return self.HEADERS + + def update_cookies(self, jar): + for cookie in jar: + self.cookies.update({ + cookie.name: cookie.value + }) + + def requests_provider(self, url, post=False, data=None, update_cookies=True, **kwargs): + try: + response = getattr(requests, "post" if post else "get")( + url, + headers=self.return_headers(url), + data=data, + **kwargs + ) + + except (requests.ConnectionError, 
requests.ConnectTimeout, requests.RequestException) as request_exception: + self.display.error(str(request_exception)) + return 0 + + if update_cookies: + self.update_cookies(response.cookies) + + return response + + def do_login(self, email, password): + response = self.requests_provider(self.BASE_URL) + if response == 0: + self.display.exit("Login: unable to reach Safari Books Online. Try again...") + + csrf = [] + try: + csrf = html.fromstring(response.text).xpath("//input[@name='csrfmiddlewaretoken'][@value]") + + except (html.etree.ParseError, html.etree.ParserError) as parsing_error: + self.display.error(parsing_error) + self.display.exit( + "Login: error trying to parse the home of Safari Books Online." + ) + + if not len(csrf): + self.display.exit("Login: no CSRF Token found in the page." + " Unable to continue the login." + " Try again...") + + csrf = csrf[0].attrib["value"] + response = self.requests_provider( + self.LOGIN_URL, + post=True, + data=( + ("csrfmiddlewaretoken", ""), ("csrfmiddlewaretoken", csrf), + ("email", email), ("password1", password), + ("is_login_form", "true"), ("leaveblank", ""), + ("dontchange", "http://") + ), + allow_redirects=False + ) + + if response == 0: + self.display.exit("Login: unable to perform auth to Safari Books Online.\n Try again...") + + if response.status_code != 302: + try: + error_page = html.fromstring(response.text) + errors_message = error_page.xpath("//ul[@class='errorlist']//li/text()") + recaptcha = error_page.xpath("//div[@class='g-recaptcha']") + messages = ([" `%s`" % error for error in errors_message + if "password" in error or "email" in error] if len(errors_message) else []) +\ + ([" `ReCaptcha required (wait or do logout from the website).`"] if len(recaptcha) else[]) + self.display.exit("Login: unable to perform auth login to Safari Books Online.\n" + + self.display.SH_YELLOW + "[*]" + self.display.SH_DEFAULT + " Details:\n" + "%s" % "\n".join(messages if len(messages) else [" Unexpected error!"])) 
+ except (html.etree.ParseError, html.etree.ParserError) as parsing_error: + self.display.error(parsing_error) + self.display.exit( + "Login: your login went wrong and it encountered in an error" + " trying to parse the login details of Safari Books Online. Try again..." + ) + + def get_book_info(self): + response = self.requests_provider(self.api_url) + if response == 0: + self.display.exit("API: unable to retrieve book info.") + + response = response.json() + if not isinstance(response, dict) or len(response.keys()) == 1: + self.display.exit(self.display.api_error(response)) + + if "last_chapter_read" in response: + del response["last_chapter_read"] + + return response + + def get_book_chapters(self, page=0): + response = self.requests_provider(urljoin(self.api_url, "chapter/" + ("" if not page else "?page=%s" % page))) + if response == 0: + self.display.exit("API: unable to retrieve book chapters.") + + response = response.json() + + if not isinstance(response, dict) or len(response.keys()) == 1: + self.display.exit(self.display.api_error(response)) + + if "results" not in response or not len(response["results"]): + self.display.exit("API: unable to retrieve book chapters.") + + result = [] + result.extend([c for c in response["results"] if "cover." 
in c["filename"]]) + for c in result: + del response["results"][response["results"].index(c)] + + result += response["results"] + return result + (self.get_book_chapters(page + 1) if response["next"] else []) + + def get_html(self, url): + response = self.requests_provider(url) + if response == 0: + self.display.exit( + "Crawler: error trying to retrieve this page: %s (%s)\n From: %s" % + (self.filename, self.chapter_title, url) + ) + + root = None + try: + root = html.fromstring(response.text, base_url=self.BASE_URL) + + except (html.etree.ParseError, html.etree.ParserError) as parsing_error: + self.display.error(parsing_error) + self.display.exit( + "Crawler: error trying to parse this page: %s (%s)\n From: %s" % + (self.filename, self.chapter_title, url) + ) + + return root + + def link_replace(self, link): + if link[0] == "/" and ("cover" in link or "images" in link or "graphics" in link + or link[-3:] in ["jpg", "jpeg", "png"]): + self.images.append(link) + self.display.log("Crawler: found a new image at %s" % link) + image = link.split("/")[-1] + return "Images/" + image + + elif link[0] not in ["/", "h"]: + return link.replace(".html", ".xhtml") + + return link + + def parse_html(self, root): + if random() > 0.5: + if len(root.xpath("//div[@class='controls']/a/text()")): + self.display.exit(self.display.api_error(" ")) + + book_content = root.xpath("//div[@id='sbo-rt-content']") + if not len(book_content): + self.display.exit( + "Parser: book content's corrupted or not present: %s (%s)" % + (self.filename, self.chapter_title) + ) + + page_css = "" + stylesheet_links = root.xpath("//link[@rel='stylesheet']") + if len(stylesheet_links): + stylesheet_count = 0 + for s in stylesheet_links: + css_url = urljoin("https:", s.attrib["href"]) if s.attrib["href"][:2] == "//" \ + else urljoin(self.base_url, s.attrib["href"]) + + if css_url not in self.css: + self.css.append(css_url) + self.display.log("Crawler: found a new CSS at %s" % css_url) + + stylesheet_count += 1 
+                page_css += "<link href=\"Styles/Style{0:0>2}.css\" " \
+                            "rel=\"stylesheet\" type=\"text/css\" />\n".format(stylesheet_count)
+
+        stylesheets = root.xpath("//style")
+        if len(stylesheets):
+            for css in stylesheets:
+                if "data-template" in css.attrib and len(css.attrib["data-template"]):
+                    css.text = css.attrib["data-template"]
+                    del css.attrib["data-template"]
+
+                try:
+                    page_css += html.tostring(css, method="xml", encoding='unicode') + "\n"
+
+                except (html.etree.ParseError, html.etree.ParserError) as parsing_error:
+                    self.display.error(parsing_error)
+                    self.display.exit(
+                        "Parser: error trying to parse one CSS found in this page: %s (%s)" %
+                        (self.filename, self.chapter_title)
+                    )
+
+        book_content = book_content[0]
+        book_content.rewrite_links(self.link_replace)
+
+        xhtml = None
+        try:
+            xhtml = html.tostring(book_content, method="xml", encoding='unicode')
+
+        except (html.etree.ParseError, html.etree.ParserError) as parsing_error:
+            self.display.error(parsing_error)
+            self.display.exit(
+                "Parser: error trying to parse HTML of this page: %s (%s)" %
+                (self.filename, self.chapter_title)
+            )
+
+        return page_css, xhtml
+
+    def create_dirs(self):
+        if os.path.isdir(self.BOOK_PATH):
+            self.display.log("Book directory already exists: %s" % self.book_title)
+
+        else:
+            os.makedirs(self.BOOK_PATH)
+
+        oebps = os.path.join(self.BOOK_PATH, "OEBPS")
+        if not os.path.isdir(oebps):
+            self.display.book_ad_info = True
+            os.makedirs(oebps)
+
+    def save_page_html(self, contents):
+        self.filename = self.filename.replace(".html", ".xhtml")
+        open(os.path.join(self.BOOK_PATH, "OEBPS", self.filename), "w")\
+            .write(self.BASE_HTML.format(contents[0], contents[1]))
+        self.display.log("Created: %s" % self.filename)
+
+    def get(self):
+        if not len(self.chapters_queue):
+            return
+
+        next_chapter = self.chapters_queue.pop(0)
+        self.chapter_title = next_chapter["title"]
+        self.filename = next_chapter["filename"]
+
+        if os.path.isfile(os.path.join(self.BOOK_PATH, "OEBPS", self.filename.replace(".html",
".xhtml"))): + if not self.display.book_ad_info and \ + next_chapter not in self.book_chapters[:self.book_chapters.index(next_chapter)]: + self.display.info("File `%s` already exists.\n" + " If you want to download again all the book%s,\n" + " please delete the `/OEBPS/*.xhtml` files and restart the program." % + (self.filename.replace(".html", ".xhtml"), + " (especially because you selected the `--no-kindle` option)" if self.args.no_kindle + else "")) + self.display.book_ad_info = 1 + + else: + self.save_page_html(self.parse_html(self.get_html(urljoin(self.base_url, self.filename)))) + + self.display.state(len(self.book_chapters), len(self.book_chapters) - len(self.chapters_queue)) + self.get() + + def _thread_download_css(self, url, done_queue): + css_file = os.path.join(self.css_path, "Style{0:0>2}.css".format(self.css.index(url))) + if os.path.isfile(css_file): + if not self.display.css_ad_info.value and url not in self.css[:self.css.index(url)]: + self.display.info("File `%s` already exists.\n" + " If you want to download again all the CSSs,\n" + " please delete the `/OEBPS/*.xhtml` and `/OEBPS/Styles/*`" + " files and restart the program." 
% + css_file) + self.display.css_ad_info.value = 1 + + else: + response = self.requests_provider(url, update_cookies=False) + if response == 0: + self.display.error("Error trying to retrieve this CSS: %s\n From: %s" % (css_file, url)) + + with open(css_file, 'wb') as s: + for chunk in response.iter_content(1024): + s.write(chunk) + + done_queue.put(1) + self.display.state(len(self.css), done_queue.qsize()) + + def _thread_download_images(self, url, done_queue): + image_name = url.split("/")[-1] + image_path = os.path.join(self.images_path, image_name) + if os.path.isfile(image_path): + if not self.display.images_ad_info.value and url not in self.images[:self.images.index(url)]: + self.display.info("File `%s` already exists.\n" + " If you want to download again all the images,\n" + " please delete the `/OEBPS/*.xhtml` and `/OEBPS/Images/*`" + " files and restart the program." % + image_name) + self.display.images_ad_info.value = 1 + + else: + response = self.requests_provider(urljoin(self.BASE_URL, url), + update_cookies=False, + stream=True) + if response == 0: + self.display.error("Error trying to retrieve this image: %s\n From: %s" % (image_name, url)) + + with open(image_path, 'wb') as img: + for chunk in response.iter_content(1024): + img.write(chunk) + + done_queue.put(1) + self.display.state(len(self.images), done_queue.qsize()) + + def _start_multiprocessing(self, operation, full_queue, done_queue=None): + if not done_queue: + done_queue = Queue(0) + + if len(full_queue) > 5: + for i in range(0, len(full_queue), 5): + self._start_multiprocessing(operation, full_queue[i:i+5], done_queue) + + else: + process_queue = [Process(target=operation, args=(arg, done_queue)) for arg in full_queue] + for proc in process_queue: + proc.start() + + for proc in process_queue: + proc.join() + + def collect_css(self): + self.css_path = os.path.join(self.BOOK_PATH, "OEBPS", "Styles") + if os.path.isdir(self.css_path): + self.display.log("CSSs directory already exists: %s" % 
self.css_path)
+
+        else:
+            os.makedirs(self.css_path)
+            self.display.css_ad_info.value = 1
+
+        self.display.state_status.value = -1
+        self._start_multiprocessing(self._thread_download_css, self.css)
+
+    def collect_images(self):
+        self.images_path = os.path.join(self.BOOK_PATH, "OEBPS", "Images")
+        if os.path.isdir(self.images_path):
+            self.display.log("Images directory already exists: %s" % self.images_path)
+
+        else:
+            os.makedirs(self.images_path)
+            self.display.images_ad_info.value = 1
+
+        if self.display.book_ad_info == 1:
+            self.display.info("Some of the book contents were already downloaded.\n"
+                              " If you want to be sure that all the images will be downloaded,\n"
+                              " please delete the `/OEBPS/*.xhtml` files and restart the program.")
+
+        self.display.state_status.value = -1
+        self._start_multiprocessing(self._thread_download_images, self.images)
+
+    def create_content_opf(self):
+        self.cover = self.images[0] if len(self.images) else ""
+        self.css = next(os.walk(self.css_path))[2]
+        self.images = next(os.walk(self.images_path))[2]
+
+        manifest = []
+        spine = []
+        for c in self.book_chapters:
+            c["filename"] = c["filename"].replace(".html", ".xhtml")
+            item_id = escape("".join(c["filename"].split(".")[:-1]))
+            manifest.append("<item id=\"{0}\" href=\"{1}\" media-type=\"application/xhtml+xml\" />".format(
+                item_id, c["filename"]
+            ))
+            spine.append("<itemref idref=\"{0}\"/>".format(item_id))
+
+        alt_cover_id = False
+        for i in self.images:
+            dot_split = i.split(".")
+            head = "img_" + escape("".join(dot_split[:-1]))
+            extension = dot_split[-1]
+            manifest.append("<item id=\"{0}\" href=\"Images/{1}\" media-type=\"image/{2}\" />".format(
+                head, i, "jpeg" if "jp" in extension else extension
+            ))
+
+            if not alt_cover_id:
+                alt_cover_id = head
+
+        for i in range(1, len(self.css) + 1):
+            manifest.append("<item id=\"style_{0:0>2}\" href=\"Styles/Style{0:0>2}.css\" "
+                            "media-type=\"text/css\" />".format(i))
+
+        authors = "\n".join("<dc:creator opf:file-as=\"{0}\" opf:role=\"aut\">{0}</dc:creator>".format(
+            escape(aut["name"])
+        ) for aut in self.book_info["authors"])
+
+        subjects = "\n".join("<dc:subject>{0}</dc:subject>".format(escape(sub["name"]))
+                             for sub in self.book_info["subjects"])
+
+        return self.CONTENT_OPF.format(
+            (self.book_info["isbn"] if len(self.book_info["isbn"]) else self.book_id),
+            escape(self.book_title),
+            authors,
+            escape(self.book_info["description"]),
+            subjects,
+            ", ".join(escape(pub["name"]) for pub in self.book_info["publishers"]),
+            escape(self.book_info["rights"]),
+            self.cover if self.cover else alt_cover_id,
+            "\n".join(manifest),
+            "\n".join(spine),
+            self.book_chapters[0]["filename"].replace(".html", ".xhtml")
+        )
+
+    @staticmethod
+    def parse_toc(l, c=0, mx=0):
+        r = ""
+        for cc in l:
+            c += 1
+            if int(cc["depth"]) > mx:
+                mx = int(cc["depth"])
+
+            r += "<navPoint id=\"{0}\" playOrder=\"{1}\">" \
+                 "<navLabel><text>{2}</text></navLabel>" \
+                 "<content src=\"{3}\"/>".format(
+                    cc["fragment"] if len(cc["fragment"]) else cc["id"], c,
+                    escape(cc["label"]), cc["href"].replace(".html", ".xhtml")
+                 )
+
+            if cc["children"]:
+                sr, c, mx = SafariBooks.parse_toc(cc["children"], c, mx)
+                r += sr
+
+            r += "</navPoint>\n"
+
+        return r, c, mx
+
+    def create_toc(self):
+        response = self.requests_provider(urljoin(self.api_url, "toc/"))
+        if response == 0:
+            self.display.exit("API: unable to retrieve book chapters. "
+                              "Don't delete any files, just run again this program"
+                              " in order to complete the `.epub` creation!")
+
+        response = response.json()
+
+        if not isinstance(response, list) and len(response.keys()) == 1:
+            self.display.exit(
+                self.display.api_error(response) +
+                " Don't delete any files, just run again this program"
+                " in order to complete the `.epub` creation!"
+ ) + + navmap, _, max_depth = self.parse_toc(response) + return self.TOC_NCX.format( + (self.book_info["isbn"] if len(self.book_info["isbn"]) else self.book_id), + max_depth, + self.book_title, + ", ".join(aut["name"] for aut in self.book_info["authors"]), + navmap + ) + + def create_epub(self): + open(os.path.join(self.BOOK_PATH, "mimetype"), "w").write("application/epub+zip") + meta_info = os.path.join(self.BOOK_PATH, "META-INF") + if os.path.isdir(meta_info): + self.display.log("META-INF directory already exists: %s" % meta_info) + + else: + os.makedirs(meta_info) + + open(os.path.join(meta_info, "container.xml"), "w").write(self.CONTAINER_XML) + open(os.path.join(self.BOOK_PATH, "OEBPS", "content.opf"), "w").write(self.create_content_opf()) + open(os.path.join(self.BOOK_PATH, "OEBPS", "toc.ncx"), "w").write(self.create_toc()) + + zip_file = os.path.join(self.BOOK_PATH, self.book_title) + if os.path.isfile(zip_file + ".epub"): + os.remove(zip_file + ".epub") + if os.path.isfile(zip_file + ".zip"): + os.remove(zip_file + ".zip") + shutil.make_archive(zip_file, 'zip', self.BOOK_PATH) + os.rename(zip_file + ".zip", zip_file + ".epub") + + +# MAIN +arguments = argparse.ArgumentParser(prog="safaribooks.py", + description="Download and generate an EPUB of your favorite books" + " from Safari Books Online.", + add_help=False, + allow_abbrev=False) + +arguments.add_argument( + "--cred", metavar="", default=False, + help="Credentials used to perform the auth login on Safari Books Online." + " Es. ` --cred \"account_mail@mail.com:password01\" `." +) +arguments.add_argument( + "--no-cookies", dest="no_cookies", action='store_true', + help="Prevent your session data to be saved into `cookies.json` file." +) +arguments.add_argument( + "--no-kindle", dest="no_kindle", action='store_true', + help="Remove some CSS rules that block overflow on `table` and `pre` elements." + " Use this option if you're not going to export the EPUB to E-Readers like Amazon Kindle." 
+) +arguments.add_argument( + "--preserve-log", dest="log", action='store_true', help="Leave the `info.log` file even if there isn't any error." +) +arguments.add_argument("--help", action="help", default=argparse.SUPPRESS, help='Show this help message.') + +arguments.add_argument( + "bookid", metavar='', + help="Book digits ID that you want to download. You can find it in the URL (X-es):" + " `https://www.safaribooksonline.com/library/view/book-name/XXXXXXXXXXXXX/`" +) + +args_parsed = arguments.parse_args() + +if args_parsed.cred: + cred = args_parsed.cred.split(":") + if len(cred) != 2 or "@" not in cred[0]: + arguments.error("invalid credential: %s" % args_parsed.cred) + + args_parsed.cred = cred + +else: + if args_parsed.no_cookies: + arguments.error("invalid option: `--no-cookies` is valid only if you use the `--cred` option") + +if not args_parsed.bookid.isdigit(): + arguments.error("invalid book id: %s" % args_parsed.bookid) + +SafariBooks(args_parsed) From ac20e8bfa29dcff10ba37be71a7373f2fb33de51 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Tue, 12 Dec 2017 16:41:52 +0100 Subject: [PATCH 013/100] Update safaribooks.py --- safaribooks.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index 11b35e2..fc50f18 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -556,7 +556,7 @@ def get(self): (self.filename.replace(".html", ".xhtml"), " (especially because you selected the `--no-kindle` option)" if self.args.no_kindle else "")) - self.display.book_ad_info = 1 + self.display.book_ad_info = 2 else: self.save_page_html(self.parse_html(self.get_html(urljoin(self.base_url, self.filename)))) @@ -650,7 +650,7 @@ def collect_images(self): os.makedirs(self.images_path) self.display.images_ad_info.value = 1 - if self.display.book_ad_info == 1: + if self.display.book_ad_info == 2: self.display.info("Some of the book contents were already downloaded.\n" " If you want to be sure that all the images will be 
downloaded,\n" " please delete the `/OEBPS/*.xhtml` files and restart the program.") From 4cc96f32120a18af6ff50d1a2cc055fc04ea1b76 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Wed, 13 Dec 2017 11:31:06 +0100 Subject: [PATCH 014/100] CSS improvement: add a new rule for .bq elements --- safaribooks.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/safaribooks.py b/safaribooks.py index fc50f18..6a7a577 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -178,7 +178,7 @@ class SafariBooks: "{0}\n" \ "" + book_content = book_content[0] book_content.rewrite_links(self.link_replace) + # TODO: add all not covered tag for `link_replace` function + svg_image_tags = root.xpath("//image") + if len(svg_image_tags): + for img in svg_image_tags: + image_attr_href = [x for x in img.attrib.keys() if "href" in x] + if len(image_attr_href): + svg_url = img.attrib.get(image_attr_href[0]) + svg_root = img.getparent().getparent() + new_img = svg_root.makeelement("img") + new_img.attrib.update({"src": self.link_replace(svg_url)}) + svg_root.remove(img.getparent()) + svg_root.append(new_img) + xhtml = None try: xhtml = html.tostring(book_content, method="xml", encoding='unicode') @@ -577,6 +591,8 @@ def get(self): if not len(self.chapters_queue): return + is_cover = len_books == len(self.chapters_queue) + next_chapter = self.chapters_queue.pop(0) self.chapter_title = next_chapter["title"] self.filename = next_chapter["filename"] @@ -597,7 +613,7 @@ def get(self): self.display.book_ad_info = 2 else: - self.save_page_html(self.parse_html(self.get_html(urljoin(self.base_url, self.filename)))) + self.save_page_html(self.parse_html(self.get_html(urljoin(self.base_url, self.filename)), is_cover)) self.display.state(len_books, len_books - len(self.chapters_queue)) From e90c0a9faa9a14f7f5ff6bd2285f29b89c301139 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Fri, 2 Feb 2018 12:14:36 +0100 Subject: [PATCH 023/100] Update: bug fix --- safaribooks.py | 6 ++++++ 1 
file changed, 6 insertions(+) diff --git a/safaribooks.py b/safaribooks.py index 523bf53..2d98035 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -282,6 +282,9 @@ def __init__(self, args): self.book_chapters = self.get_book_chapters() self.chapters_queue = self.book_chapters[:] + if len(self.book_chapters) > sys.getrecursionlimit(): + sys.setrecursionlimit(len(self.book_chapters)) + self.book_title = self.book_info["title"] self.base_url = self.book_info["web_url"] @@ -439,6 +442,9 @@ def get_book_chapters(self, page=0): if "results" not in response or not len(response["results"]): self.display.exit("API: unable to retrieve book chapters.") + if response["count"] > sys.getrecursionlimit(): + sys.setrecursionlimit(response["count"]) + result = [] result.extend([c for c in response["results"] if "cover." in c["filename"]]) for c in result: From 5caf9768d8f43f438d2e66dcc03864c4a6234c84 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Fri, 2 Feb 2018 12:22:15 +0100 Subject: [PATCH 024/100] Update README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 4fbcca2..8301c16 100644 --- a/README.md +++ b/README.md @@ -105,7 +105,7 @@ In the other hand, if you're not going to export the `EPUB`, you can use the `-- [-] URL: https://www.safaribooksonline.com/library/view/test-driven-development-with/9781491958698/ [*] Retrieving book chapters... [*] Output directory: - /XXXX/XXXX/Test-Driven Development with Python, 2nd Edition + /XXXX/XXXX/Books/Test-Driven Development with Python, 2nd Edition [-] Downloading book contents... (73 chapters) [#########################################----------------------------] 60% ... 
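The recursion-limit workaround in the patch above exists because `get_book_chapters` calls itself once per API page, so very long books can exhaust Python's default call-stack depth. A recursion-free sketch of the same pagination loop, using a hypothetical `fetch_page(page)` callable (standing in for the program's `requests_provider` + `.json()` round trip) that returns the API's `{"results": [...], "next": ...}` dict shape:

```python
def collect_chapters(fetch_page):
    """Iteratively drain a paginated chapter API.

    `fetch_page` is a hypothetical callable: given a 1-based page
    number it returns a dict with "results" (a list of chapters)
    and "next" (truthy while more pages remain).
    """
    chapters = []
    page = 1
    while True:
        data = fetch_page(page)
        chapters.extend(data["results"])
        if not data.get("next"):
            return chapters
        page += 1
```

With this shape the chapter count never touches `sys.setrecursionlimit`, no matter how many pages the API returns.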
From 0c9aab6b33739588cf1ed89be61be776223fe237 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Tue, 20 Feb 2018 19:43:19 +0100 Subject: [PATCH 025/100] Update README.md --- README.md | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/README.md b/README.md index 8301c16..7da2323 100644 --- a/README.md +++ b/README.md @@ -1,5 +1,5 @@ # SafariBooks -Download and generate an *EPUB* of your favorite books from [*Safari Books Online*](https://www.safaribooksonline.com) library. +Download and generate *EPUB* of your favorite books from [*Safari Books Online*](https://www.safaribooksonline.com) library. Use this program only for *personal* and/or *educational* purpose. ## Overview: @@ -43,7 +43,7 @@ usage: safaribooks.py [--cred ] [--no-cookies] [--no-kindle] [--preserve-log] [--help] -Download and generate an EPUB of your favorite books from Safari Books Online. +Download and generate EPUB of your favorite books from Safari Books Online. positional arguments: Book digits ID that you want to download. From cdb96d6fcec769b0bbe3bc13e1e1abf67961dffb Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Thu, 22 Feb 2018 17:01:24 +0100 Subject: [PATCH 026/100] Update README.md Fixes #2 --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 7da2323..430d81f 100644 --- a/README.md +++ b/README.md @@ -66,7 +66,7 @@ optional arguments: ``` The first time you'll use the program, you'll have to specify your Safari Books Online account credentials. -For the next times you'll download a book, before session expires, you can omit the credential, because the program save your session cookies in a file called `cookies.json`. +For the next times you'll download a book, before session expires, you can omit the credential, because the program save your session cookies in a file called `cookies.json` (see file format [`here`](/../../issues/2)). 
Pay attention if you use a shared PC, because everyone that has access to your files can steal your session. If you don't want to cache the cookies, just use the `--no-cookies` option and provide all the time your `--cred`. From a9f1eb71a0dee6bedf6999140c9bb8174a232dcf Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Thu, 22 Feb 2018 17:03:20 +0100 Subject: [PATCH 027/100] Update README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 430d81f..0700f36 100644 --- a/README.md +++ b/README.md @@ -66,7 +66,7 @@ optional arguments: ``` The first time you'll use the program, you'll have to specify your Safari Books Online account credentials. -For the next times you'll download a book, before session expires, you can omit the credential, because the program save your session cookies in a file called `cookies.json` (see file format [`here`](/../../issues/2)). +For the next times you'll download a book, before session expires, you can omit the credential, because the program save your session cookies in a file called `cookies.json` (see file format [`here`](/../../issues/2#issuecomment-367726544)). Pay attention if you use a shared PC, because everyone that has access to your files can steal your session. If you don't want to cache the cookies, just use the `--no-cookies` option and provide all the time your `--cred`. 
From f38eeb67486017e11cc25181a13c49407a4171ce Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Fri, 23 Feb 2018 18:06:57 +0100 Subject: [PATCH 028/100] Fixed #4 --- safaribooks.py | 25 ++++++++++++++++++++----- 1 file changed, 20 insertions(+), 5 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index 2d98035..6613b00 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -1,3 +1,4 @@ +#!/usr/bin/env python3 # coding: utf-8 import os import sys @@ -10,8 +11,8 @@ from lxml import html from html import escape from random import random -from urllib.parse import urljoin, urlsplit, urlparse from multiprocessing import Process, Queue, Value +from urllib.parse import urljoin, urlsplit, urlparse PATH = os.path.dirname(os.path.realpath(__file__)) @@ -288,7 +289,8 @@ def __init__(self, args): self.book_title = self.book_info["title"] self.base_url = self.book_info["web_url"] - self.BOOK_PATH = os.path.join(PATH, "Books", self.book_title) + self.clean_book_title = self.clean_dirname(self.book_title) + self.BOOK_PATH = os.path.join(PATH, "Books", self.clean_book_title) self.create_dirs() self.display.info("Output directory:\n %s" % self.BOOK_PATH) @@ -318,7 +320,7 @@ def __init__(self, args): if not args.no_cookies: json.dump(self.cookies, open(COOKIES_FILE, "w")) - self.display.done(self.book_title + ".epub") + self.display.done(self.clean_book_title + ".epub") if not self.display.in_error and not args.log: os.remove(self.display.log_file) @@ -572,6 +574,18 @@ def parse_html(self, root, is_cover=False): return page_css, xhtml + @staticmethod + def clean_dirname(dirname): + if ":" in dirname: + if dirname.index(":") > 45: + dirname = dirname.split(":")[0] + + for ch in ['\\', '/', '<', '>', '`', '\'', '"', '*', '?', ':', '|']: + if ch in dirname: + dirname = dirname.replace(ch, "_") + + return dirname + def create_dirs(self): if os.path.isdir(self.BOOK_PATH): self.display.log("Book directory already exists: %s" % self.book_title) @@ -842,13 +856,14 @@ def 
create_epub(self): open(os.path.join(self.BOOK_PATH, "OEBPS", "content.opf"), "w").write(self.create_content_opf()) open(os.path.join(self.BOOK_PATH, "OEBPS", "toc.ncx"), "w").write(self.create_toc()) - zip_file = os.path.join(self.BOOK_PATH, self.book_title) + zip_file = os.path.join(PATH, "Books", self.book_id) if os.path.isfile(zip_file + ".epub"): os.remove(zip_file + ".epub") if os.path.isfile(zip_file + ".zip"): os.remove(zip_file + ".zip") + shutil.make_archive(zip_file, 'zip', self.BOOK_PATH) - os.rename(zip_file + ".zip", zip_file + ".epub") + os.rename(zip_file + ".zip", os.path.join(self.BOOK_PATH, self.clean_book_title) + ".epub") # MAIN From 3458e4b98a8dc903cff389ffea415de4f9901941 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Fri, 23 Feb 2018 18:11:26 +0100 Subject: [PATCH 029/100] Update safaribooks.py --- safaribooks.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/safaribooks.py b/safaribooks.py index 6613b00..cffd72a 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -580,7 +580,7 @@ def clean_dirname(dirname): if dirname.index(":") > 45: dirname = dirname.split(":")[0] - for ch in ['\\', '/', '<', '>', '`', '\'', '"', '*', '?', ':', '|']: + for ch in ['\\', '/', '<', '>', '`', '\'', '"', '*', '?', '|']: if ch in dirname: dirname = dirname.replace(ch, "_") From 67b3e11d26f97b773056bab6df2aa18ae85de7c7 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Sun, 25 Feb 2018 19:10:16 +0100 Subject: [PATCH 030/100] Added verbosity at debug log Fixed #3 --- safaribooks.py | 27 ++++++++++++++++++++++----- 1 file changed, 22 insertions(+), 5 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index cffd72a..6535bbd 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -47,6 +47,7 @@ def __init__(self, log_file): self.book_ad_info = False self.css_ad_info = Value("i", 0) self.images_ad_info = Value("i", 0) + self.last_request = (None,) self.in_error = False self.state_status = Value("i", 0) @@ -85,6 +86,10 @@ def 
exit(self, error): def unhandled_exception(self, _, o, tb): self.log("".join(traceback.format_tb(tb))) + if any(self.last_request): + self.log("Last request done:\n\tURL: {0}\n\tDATA: {1}\n\tOTHERS: {2}\n\n\t{3}\n{4}\n\n{5}\n" + .format(*self.last_request)) + self.exit("Unhandled Exception: %s (type: %s)" % (o, o.__class__.__name__)) def intro(self): @@ -354,6 +359,12 @@ def requests_provider(self, url, post=False, data=None, update_cookies=True, **k **kwargs ) + self.display.last_request = ( + url, data, kwargs, response.status_code, "\n".join( + ["\t{}: {}".format(*h) for h in response.headers.items()] + ), response.text + ) + except (requests.ConnectionError, requests.ConnectTimeout, requests.RequestException) as request_exception: self.display.error(str(request_exception)) return 0 @@ -577,7 +588,7 @@ def parse_html(self, root, is_cover=False): @staticmethod def clean_dirname(dirname): if ":" in dirname: - if dirname.index(":") > 45: + if dirname.index(":") > 30: dirname = dirname.split(":")[0] for ch in ['\\', '/', '<', '>', '`', '\'', '"', '*', '?', '|']: @@ -601,7 +612,7 @@ def create_dirs(self): def save_page_html(self, contents): self.filename = self.filename.replace(".html", ".xhtml") open(os.path.join(self.BOOK_PATH, "OEBPS", self.filename), "wb")\ - .write(self.BASE_HTML.format(contents[0], contents[1]).encode("utf-8", "replace")) + .write(self.BASE_HTML.format(contents[0], contents[1]).encode("utf-8", 'xmlcharrefreplace')) self.display.log("Created: %s" % self.filename) def get(self): @@ -852,9 +863,15 @@ def create_epub(self): else: os.makedirs(meta_info) - open(os.path.join(meta_info, "container.xml"), "w").write(self.CONTAINER_XML) - open(os.path.join(self.BOOK_PATH, "OEBPS", "content.opf"), "w").write(self.create_content_opf()) - open(os.path.join(self.BOOK_PATH, "OEBPS", "toc.ncx"), "w").write(self.create_toc()) + open(os.path.join(meta_info, "container.xml"), "wb").write( + self.CONTAINER_XML.encode("utf-8", "xmlcharrefreplace") + ) + 
open(os.path.join(self.BOOK_PATH, "OEBPS", "content.opf"), "wb").write( + self.create_content_opf().encode("utf-8", "xmlcharrefreplace") + ) + open(os.path.join(self.BOOK_PATH, "OEBPS", "toc.ncx"), "wb").write( + self.create_toc().encode("utf-8", "xmlcharrefreplace") + ) zip_file = os.path.join(PATH, "Books", self.book_id) if os.path.isfile(zip_file + ".epub"): From cfad39c38229c384580f74d53d46b51ac03ce647 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Mon, 26 Feb 2018 20:13:10 +0100 Subject: [PATCH 031/100] Updated and fixed #3 --- safaribooks.py | 79 +++++++++++++++++++++++++++++++++++++++----------- 1 file changed, 62 insertions(+), 17 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index 6535bbd..97ca52b 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -82,16 +82,19 @@ def exit(self, error): output = self.SH_BG_RED + "[!]" + self.SH_DEFAULT + " Aborting..." self.out(output) + + self.save_last_request() sys.exit(128) def unhandled_exception(self, _, o, tb): self.log("".join(traceback.format_tb(tb))) + self.exit("Unhandled Exception: %s (type: %s)" % (o, o.__class__.__name__)) + + def save_last_request(self): if any(self.last_request): self.log("Last request done:\n\tURL: {0}\n\tDATA: {1}\n\tOTHERS: {2}\n\n\t{3}\n{4}\n\n{5}\n" .format(*self.last_request)) - self.exit("Unhandled Exception: %s (type: %s)" % (o, o.__class__.__name__)) - def intro(self): output = self.SH_YELLOW + """ ____ ___ _ @@ -286,6 +289,16 @@ def __init__(self, args): self.display.info("Retrieving book chapters...") self.book_chapters = self.get_book_chapters() + + self.no_cover = False + if "cover" not in self.book_chapters[0]["filename"] or "cover" not in self.book_chapters[0]["title"]: + self.book_chapters = [{ + "filename": "cover", + "title": "Cover", + "web_url": self.book_info["cover"] + }] + self.book_chapters + self.no_cover = True + self.chapters_queue = self.book_chapters[:] if len(self.book_chapters) > sys.getrecursionlimit(): @@ -306,6 +319,7 @@ def 
__init__(self, args): self.display.info("Downloading book contents... (%s chapters)" % len(self.book_chapters), state=True) self.BASE_HTML = self.BASE_01_HTML + (self.KINDLE_HTML if not args.no_kindle else "") + self.BASE_02_HTML + self.get() self.css_path = "" @@ -442,8 +456,8 @@ def get_book_info(self): return response - def get_book_chapters(self, page=0): - response = self.requests_provider(urljoin(self.api_url, "chapter/" + ("" if not page else "?page=%s" % page))) + def get_book_chapters(self, page=1): + response = self.requests_provider(urljoin(self.api_url, "chapter/?page=%s" % page)) if response == 0: self.display.exit("API: unable to retrieve book chapters.") @@ -463,7 +477,7 @@ def get_book_chapters(self, page=0): for c in result: del response["results"][response["results"].index(c)] - result += response["results"] + result += response["results"] return result + (self.get_book_chapters(page + 1) if response["next"] else []) def get_html(self, url): @@ -532,9 +546,9 @@ def parse_html(self, root, is_cover=False): self.css.append(css_url) self.display.log("Crawler: found a new CSS at %s" % css_url) - stylesheet_count += 1 page_css += "2}.css\" " \ "rel=\"stylesheet\" type=\"text/css\" />\n".format(stylesheet_count) + stylesheet_count += 1 stylesheets = root.xpath("//style") if len(stylesheets): @@ -553,12 +567,6 @@ def parse_html(self, root, is_cover=False): (self.filename, self.chapter_title) ) - if is_cover: - page_css += "" - - book_content = book_content[0] - book_content.rewrite_links(self.link_replace) - # TODO: add all not covered tag for `link_replace` function svg_image_tags = root.xpath("//image") if len(svg_image_tags): @@ -568,12 +576,31 @@ def parse_html(self, root, is_cover=False): svg_url = img.attrib.get(image_attr_href[0]) svg_root = img.getparent().getparent() new_img = svg_root.makeelement("img") - new_img.attrib.update({"src": self.link_replace(svg_url)}) + new_img.attrib.update({"src": svg_url}) svg_root.remove(img.getparent()) 
svg_root.append(new_img) + book_content = book_content[0] + book_content.rewrite_links(self.link_replace) + xhtml = None try: + if is_cover: + page_css = "" + + cover_html = html.fromstring("
") + cover_div = cover_html.xpath("//div")[0] + + if len(book_content.xpath("//img")): + cover_img = cover_div.makeelement("img") + cover_img.attrib.update({"src": book_content.xpath("//img")[0].attrib["src"]}) + cover_div.append(cover_img) + book_content = cover_html + xhtml = html.tostring(book_content, method="xml", encoding='unicode') except (html.etree.ParseError, html.etree.ParserError) as parsing_error: @@ -644,7 +671,25 @@ def get(self): self.display.book_ad_info = 2 else: - self.save_page_html(self.parse_html(self.get_html(urljoin(self.base_url, self.filename)), is_cover)) + if is_cover and self.no_cover: + response = self.requests_provider(next_chapter["web_url"], update_cookies=False, stream=True) + if response != 0: + with open(os.path.join(self.BOOK_PATH, "OEBPS", "Images", + self.filename + "." + response.headers["Content-Type"].split("/")[-1]), 'wb') as s: + for chunk in response.iter_content(1024): + s.write(chunk) + + cover_html = self.parse_html(html.fromstring( + "
".format( + self.filename + "." + response.headers["Content-Type"].split("/")[-1] + ) + ), is_cover) + self.filename += ".xhtml" + self.book_chapters[0]["filename"] += ".xhtml" + self.save_page_html(cover_html) + continue + + self.save_page_html(self.parse_html(self.get_html(next_chapter["web_url"]), is_cover)) self.display.state(len_books, len_books - len(self.chapters_queue)) @@ -769,7 +814,7 @@ def create_content_opf(self): spine.append("".format(item_id)) alt_cover_id = False - for i in self.images: + for i in set(self.images): dot_split = i.split(".") head = "img_" + escape("".join(dot_split[:-1])) extension = dot_split[-1] @@ -780,7 +825,7 @@ def create_content_opf(self): if not alt_cover_id: alt_cover_id = head - for i in range(1, len(self.css) + 1): + for i in range(len(self.css)): manifest.append("2}\" href=\"Styles/Style{0:0>2}.css\" " "media-type=\"text/css\" />".format(i)) @@ -818,7 +863,7 @@ def parse_toc(l, c=0, mx=0): "{2}" \ "".format( cc["fragment"] if len(cc["fragment"]) else cc["id"], c, - escape(cc["label"]), cc["href"].replace(".html", ".xhtml") + escape(cc["label"]), cc["href"].replace(".html", ".xhtml").split("/")[-1] ) if cc["children"]: From 452148d40b3bb1e21bf8ad81bf41a6e850c60e1d Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Tue, 27 Feb 2018 15:13:12 +0100 Subject: [PATCH 032/100] General improvement Fixed #3 (Again) --- safaribooks.py | 158 +++++++++++++++++++++++++++---------------------- 1 file changed, 87 insertions(+), 71 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index 97ca52b..b646174 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -290,15 +290,6 @@ def __init__(self, args): self.display.info("Retrieving book chapters...") self.book_chapters = self.get_book_chapters() - self.no_cover = False - if "cover" not in self.book_chapters[0]["filename"] or "cover" not in self.book_chapters[0]["title"]: - self.book_chapters = [{ - "filename": "cover", - "title": "Cover", - "web_url": self.book_info["cover"] - }] + 
self.book_chapters - self.no_cover = True - self.chapters_queue = self.book_chapters[:] if len(self.book_chapters) > sys.getrecursionlimit(): @@ -309,6 +300,8 @@ def __init__(self, args): self.clean_book_title = self.clean_dirname(self.book_title) self.BOOK_PATH = os.path.join(PATH, "Books", self.clean_book_title) + self.css_path = "" + self.images_path = "" self.create_dirs() self.display.info("Output directory:\n %s" % self.BOOK_PATH) @@ -320,11 +313,21 @@ def __init__(self, args): self.display.info("Downloading book contents... (%s chapters)" % len(self.book_chapters), state=True) self.BASE_HTML = self.BASE_01_HTML + (self.KINDLE_HTML if not args.no_kindle else "") + self.BASE_02_HTML + self.cover = False self.get() + if not self.cover: + self.cover = self.get_default_cover() + cover_html = self.parse_html( + html.fromstring("
".format(self.cover)), True + ) - self.css_path = "" - self.images_path = "" - self.cover = "" + self.book_chapters = [{ + "filename": "default_cover.xhtml", + "title": "Cover" + }] + self.book_chapters + + self.filename = self.book_chapters[0]["filename"] + self.save_page_html(cover_html) self.css_done_queue = Queue(0) if "win" not in sys.platform else WinQueue() self.display.info("Downloading book CSSs... (%s files)" % len(self.css), state=True) @@ -473,13 +476,26 @@ def get_book_chapters(self, page=1): sys.setrecursionlimit(response["count"]) result = [] - result.extend([c for c in response["results"] if "cover." in c["filename"]]) + result.extend([c for c in response["results"] if "cover" in c["filename"] or "cover" in c["title"]]) for c in result: del response["results"][response["results"].index(c)] result += response["results"] return result + (self.get_book_chapters(page + 1) if response["next"] else []) + def get_default_cover(self): + response = self.requests_provider(self.book_info["cover"], update_cookies=False, stream=True) + if response == 0: + self.display.error("Error trying to retrieve the cover: %s" % self.book_info["cover"]) + return False + + file_ext = response.headers["Content-Type"].split("/")[-1] + with open(os.path.join(self.images_path, "default_cover." + file_ext), 'wb') as i: + for chunk in response.iter_content(1024): + i.write(chunk) + + return "default_cover." 
+ file_ext + def get_html(self, url): response = self.requests_provider(url) if response == 0: @@ -508,9 +524,9 @@ def url_is_absolute(url): def link_replace(self, link): if link: if not self.url_is_absolute(link): - link = urljoin(self.base_url, link) if "cover" in link or "images" in link or "graphics" in link or \ link[-3:] in ["jpg", "peg", "png", "gif"]: + link = urljoin(self.base_url, link) if link not in self.images: self.images.append(link) self.display.log("Crawler: found a new image at %s" % link) @@ -520,9 +536,31 @@ def link_replace(self, link): return link.replace(".html", ".xhtml") + else: + if self.book_id in link: + return self.link_replace(link.split(self.book_id)[-1]) + return link - def parse_html(self, root, is_cover=False): + @staticmethod + def get_cover(html_root): + images = html_root.xpath("//img[contains(@id, 'cover') or " + "contains(@name, 'cover') or contains(@src, 'cover')]") + if len(images): + return images[0] + + divs = html_root.xpath("//div[contains(@id, 'cover') or " + "contains(@name, 'cover') or contains(@src, 'cover')]//img") + if len(divs): + return divs[0] + + a = html_root.xpath("//a[contains(@id, 'cover') or contains(@name, 'cover') or contains(@src, 'cover')]//img") + if len(a): + return a[0] + + return None + + def parse_html(self, root, first_page=False): if random() > 0.5: if len(root.xpath("//div[@class='controls']/a/text()")): self.display.exit(self.display.api_error(" ")) @@ -585,22 +623,23 @@ def parse_html(self, root, is_cover=False): xhtml = None try: - if is_cover: - page_css = "" - - cover_html = html.fromstring("
") - cover_div = cover_html.xpath("//div")[0] - - if len(book_content.xpath("//img")): + if first_page: + is_cover = self.get_cover(book_content) + if is_cover is not None: + page_css = "" + cover_html = html.fromstring("
") + cover_div = cover_html.xpath("//div")[0] cover_img = cover_div.makeelement("img") - cover_img.attrib.update({"src": book_content.xpath("//img")[0].attrib["src"]}) + cover_img.attrib.update({"src": is_cover.attrib["src"]}) cover_div.append(cover_img) book_content = cover_html + self.cover = is_cover.attrib["src"] + xhtml = html.tostring(book_content, method="xml", encoding='unicode') except (html.etree.ParseError, html.etree.ParserError) as parsing_error: @@ -620,7 +659,7 @@ def clean_dirname(dirname): for ch in ['\\', '/', '<', '>', '`', '\'', '"', '*', '?', '|']: if ch in dirname: - dirname = dirname.replace(ch, "_") + dirname = dirname.replace(ch, "") return dirname @@ -636,6 +675,22 @@ def create_dirs(self): self.display.book_ad_info = True os.makedirs(oebps) + self.css_path = os.path.join(oebps, "Styles") + if os.path.isdir(self.css_path): + self.display.log("CSSs directory already exists: %s" % self.css_path) + + else: + os.makedirs(self.css_path) + self.display.css_ad_info.value = 1 + + self.images_path = os.path.join(oebps, "Images") + if os.path.isdir(self.images_path): + self.display.log("Images directory already exists: %s" % self.images_path) + + else: + os.makedirs(self.images_path) + self.display.images_ad_info.value = 1 + def save_page_html(self, contents): self.filename = self.filename.replace(".html", ".xhtml") open(os.path.join(self.BOOK_PATH, "OEBPS", self.filename), "wb")\ @@ -645,11 +700,11 @@ def save_page_html(self, contents): def get(self): len_books = len(self.book_chapters) - for _ in self.book_chapters: + for _ in range(len_books): if not len(self.chapters_queue): return - is_cover = len_books == len(self.chapters_queue) + first_page = len_books == len(self.chapters_queue) next_chapter = self.chapters_queue.pop(0) self.chapter_title = next_chapter["title"] @@ -671,25 +726,7 @@ def get(self): self.display.book_ad_info = 2 else: - if is_cover and self.no_cover: - response = self.requests_provider(next_chapter["web_url"], 
update_cookies=False, stream=True) - if response != 0: - with open(os.path.join(self.BOOK_PATH, "OEBPS", "Images", - self.filename + "." + response.headers["Content-Type"].split("/")[-1]), 'wb') as s: - for chunk in response.iter_content(1024): - s.write(chunk) - - cover_html = self.parse_html(html.fromstring( - "
".format( - self.filename + "." + response.headers["Content-Type"].split("/")[-1] - ) - ), is_cover) - self.filename += ".xhtml" - self.book_chapters[0]["filename"] += ".xhtml" - self.save_page_html(cover_html) - continue - - self.save_page_html(self.parse_html(self.get_html(next_chapter["web_url"]), is_cover)) + self.save_page_html(self.parse_html(self.get_html(next_chapter["web_url"]), first_page)) self.display.state(len_books, len_books - len(self.chapters_queue)) @@ -756,14 +793,6 @@ def _start_multiprocessing(self, operation, full_queue): proc.join() def collect_css(self): - self.css_path = os.path.join(self.BOOK_PATH, "OEBPS", "Styles") - if os.path.isdir(self.css_path): - self.display.log("CSSs directory already exists: %s" % self.css_path) - - else: - os.makedirs(self.css_path) - self.display.css_ad_info.value = 1 - self.display.state_status.value = -1 if "win" in sys.platform: @@ -775,14 +804,6 @@ def collect_css(self): self._start_multiprocessing(self._thread_download_css, self.css) def collect_images(self): - self.images_path = os.path.join(self.BOOK_PATH, "OEBPS", "Images") - if os.path.isdir(self.images_path): - self.display.log("Images directory already exists: %s" % self.images_path) - - else: - os.makedirs(self.images_path) - self.display.images_ad_info.value = 1 - if self.display.book_ad_info == 2: self.display.info("Some of the book contents were already downloaded.\n" " If you want to be sure that all the images will be downloaded,\n" @@ -799,7 +820,6 @@ def collect_images(self): self._start_multiprocessing(self._thread_download_images, self.images) def create_content_opf(self): - self.cover = self.images[0] if len(self.images) else "" self.css = next(os.walk(self.css_path))[2] self.images = next(os.walk(self.images_path))[2] @@ -813,7 +833,6 @@ def create_content_opf(self): )) spine.append("".format(item_id)) - alt_cover_id = False for i in set(self.images): dot_split = i.split(".") head = "img_" + escape("".join(dot_split[:-1])) @@ -822,9 
+841,6 @@ def create_content_opf(self): head, i, "jpeg" if "jp" in extension else extension )) - if not alt_cover_id: - alt_cover_id = head - for i in range(len(self.css)): manifest.append("2}\" href=\"Styles/Style{0:0>2}.css\" " "media-type=\"text/css\" />".format(i)) @@ -845,7 +861,7 @@ def create_content_opf(self): ", ".join(escape(pub["name"]) for pub in self.book_info["publishers"]), escape(self.book_info["rights"]), self.book_info["issued"], - self.cover if self.cover else alt_cover_id, + self.cover, "\n".join(manifest), "\n".join(spine), self.book_chapters[0]["filename"].replace(".html", ".xhtml") From 7526702f28c74c032986ba907b844f2904af40b0 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Thu, 1 Mar 2018 11:47:53 +0100 Subject: [PATCH 033/100] Fixed #7 --- safaribooks.py | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) diff --git a/safaribooks.py b/safaribooks.py index b646174..d1d83d1 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -299,7 +299,12 @@ def __init__(self, args): self.base_url = self.book_info["web_url"] self.clean_book_title = self.clean_dirname(self.book_title) - self.BOOK_PATH = os.path.join(PATH, "Books", self.clean_book_title) + + books_dir = os.path.join(PATH, "Books") + if not os.path.isdir(books_dir): + os.mkdir(books_dir) + + self.BOOK_PATH = os.path.join(books_dir, self.clean_book_title) self.css_path = "" self.images_path = "" self.create_dirs() From 62caeae89e184ec2505aa1bb51a8140bf000cfb4 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Thu, 1 Mar 2018 12:06:17 +0100 Subject: [PATCH 034/100] Added support for pipenv --- Pipfile | 17 +++++++++ Pipfile.lock | 102 +++++++++++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 119 insertions(+) create mode 100644 Pipfile create mode 100644 Pipfile.lock diff --git a/Pipfile b/Pipfile new file mode 100644 index 0000000..c4608ad --- /dev/null +++ b/Pipfile @@ -0,0 +1,17 @@ +[[source]] + +url = "https://pypi.python.org/simple" +verify_ssl = true +name = 
"pypi" + +[packages] + +lxml = "*" +requests = "*" + +[dev-packages] + + +[requires] + +python_version = "3.6" diff --git a/Pipfile.lock b/Pipfile.lock new file mode 100644 index 0000000..9d6b8e2 --- /dev/null +++ b/Pipfile.lock @@ -0,0 +1,102 @@ +{ + "_meta": { + "hash": { + "sha256": "bdff55965f0e3fa7b2a9b0e9df281f33860d2ae44891a2916d0ae6ce1d8c4a19" + }, + "host-environment-markers": { + "implementation_name": "cpython", + "implementation_version": "3.6.3", + "os_name": "posix", + "platform_machine": "x86_64", + "platform_python_implementation": "CPython", + "platform_release": "4.13.0-36-generic", + "platform_system": "Linux", + "platform_version": "#40-Ubuntu SMP Fri Feb 16 20:07:48 UTC 2018", + "python_full_version": "3.6.3", + "python_version": "3.6", + "sys_platform": "linux" + }, + "pipfile-spec": 6, + "requires": { + "python_version": "3.6" + }, + "sources": [ + { + "name": "pypi", + "url": "https://pypi.python.org/simple", + "verify_ssl": true + } + ] + }, + "default": { + "certifi": { + "hashes": [ + "sha256:14131608ad2fd56836d33a71ee60fa1c82bc9d2c8d98b7bdbc631fe1b3cd1296", + "sha256:edbc3f203427eef571f79a7692bb160a2b0f7ccaa31953e99bd17e307cf63f7d" + ], + "version": "==2018.1.18" + }, + "chardet": { + "hashes": [ + "sha256:fc323ffcaeaed0e0a02bf4d117757b98aed530d9ed4531e3e15460124c106691", + "sha256:84ab92ed1c4d4f16916e05906b6b75a6c0fb5db821cc65e70cbd64a3e2a5eaae" + ], + "version": "==3.0.4" + }, + "idna": { + "hashes": [ + "sha256:8c7309c718f94b3a625cb648ace320157ad16ff131ae0af362c9f21b80ef6ec4", + "sha256:2c6a5de3089009e3da7c5dde64a141dbc8551d5b7f6cf4ed7c2568d0cc520a8f" + ], + "version": "==2.6" + }, + "lxml": { + "hashes": [ + "sha256:41f59cbdab232f11680d5d4dec9f2e6782fd24d78e37ee833447702e34e675f4", + "sha256:e7e41d383f19bab9d57f5f3b18d158655bcd682e7e723f441b9e183e1e35a6b5", + "sha256:155521c337acecf8202091cff85bb9f709f238130ebadf04280fb1db11f5ad8b", + "sha256:d2c985d2460b81c6ca5feb8b86f1bc594ad59405d0bdf68626b85852b701553c", + 
"sha256:950e63387514aa1b881eba5ac6cb2ec51a118b3dafe99dd80ca19d8fb0142f30", + "sha256:470d7ce41e8047208ba1a376560bad17f1468df1f3097bc83902b26cfafdbb0c", + "sha256:e608839a5ee2180164424ccf279c8e2d9bbe8816d002c58fd97d6b621ba4aa94", + "sha256:87a66bcadac270fc010cb029022a93fc722bf1204a8b03e782d4c790f0edf7ca", + "sha256:2dedfeeecc2d5a939cf622602f5a1ce443ca82407f386880f739f1a9f08053ad", + "sha256:ba05732e4bcf59e948f61588851dcf620fd60d5bbd9d704203e5f59bbaa60219", + "sha256:2190266059fec3c5a55f9d6c30532c64c6d414d3228909c0af573fe4907e78d1", + "sha256:dd291debfaa535d9cb6cee8d7aca2328775e037d02d13f1634e57f49bc302cc4", + "sha256:29a36e354c39b2e24bc4ee103de53417ebb80f976a6ab9e8d093d559e2ac03e1", + "sha256:e37427d5a27eefbcfc48847e0b37f348113fac7280bc857421db39ffc6372570", + "sha256:b106d4d2383382399ad82108fd187e92f40b1c90f55c2d36bbcb1c44bcf940fc", + "sha256:0ee07da52d240f1dc3c83eef5cd5f1b7f018226c1121f2a54d446645779a6d17", + "sha256:3b33549fb8f91b38a7500078242b03cca513f3412a2cdae722e89bf83f95971d", + "sha256:4c12e90886d9c53ab434c8d0cebea122321cce19614c3c6b6d1a7700d7cc6212", + "sha256:79322000279cda10b53c374d53ca632ead3bc51c6aebf8e62c8fa93a4d08b750", + "sha256:6cba398eb37e0631e60e0e080c101cfe91769b2c8267105b64b4625e2581ea21", + "sha256:49a655956f8de69e1258bc0fcfc43eb3bd1e038655784d77d1869b4b81444e37", + "sha256:af8a5373241d09b8fc53e0490e1719ce5dc90a21b19db89b6596c1adcdd52270", + "sha256:e6b6698415c7e8d227a47a3b1038e1b37c2b438a1b48c2db7ad9e74ddbcd1149", + "sha256:155c916cf2645b4a8f2bd5d09065e92d1b67b8d464bdc001e0b524af84bedf6f", + "sha256:fa7320679ced5e25b20203d157280680fc84eb783b6cc650cb0c98e1858b7dd3", + "sha256:4187c4b0cefc3353181db048c51f42c489d9ac51e40b86c4851dc0671372971d", + "sha256:d5d29663e979e83b3fc361e97200f959cddb3a14797391d15273d84a5a8ae44b", + "sha256:940caef1ec7c78e0c34b0f6b94fe42d0f2022915ffc78643d28538a5cfd0f40e" + ], + "version": "==4.1.1" + }, + "requests": { + "hashes": [ + "sha256:6a1b267aa90cac58ac3a765d067950e7dbbf75b1da07e895d1f594193a40a38b", + 
"sha256:9c443e7324ba5b85070c4a818ade28bfabedf16ea10206da1132edaa6dda237e" + ], + "version": "==2.18.4" + }, + "urllib3": { + "hashes": [ + "sha256:06330f386d6e4b195fbfc736b297f58c5a892e4440e54d294d7004e3a9bbea1b", + "sha256:cc44da8e1145637334317feebd728bd869a35285b93cbb4cca2577da7e62db4f" + ], + "version": "==1.22" + } + }, + "develop": {} +} From af3238968193cbb53442ba2b2b78f6a5285b5cf7 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Thu, 1 Mar 2018 12:12:32 +0100 Subject: [PATCH 035/100] Update README.md --- README.md | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/README.md b/README.md index 0700f36..81e4f88 100644 --- a/README.md +++ b/README.md @@ -15,6 +15,10 @@ Cloning into 'safaribooks'... $ cd safaribooks/ $ pip3 install -r requirements.txt + +OR + +$ pipenv install && pipenv shell ``` The program depends of only two **Python 3** modules: From d9689dbac3747a04cde8c5e0c32b37fccfe0f0d5 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Fri, 2 Mar 2018 09:43:19 +0100 Subject: [PATCH 036/100] Fixed book name duplicates --- safaribooks.py | 10 ++++++---- 1 file changed, 6 insertions(+), 4 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index d1d83d1..4c6a2f7 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -298,7 +298,9 @@ def __init__(self, args): self.book_title = self.book_info["title"] self.base_url = self.book_info["web_url"] - self.clean_book_title = self.clean_dirname(self.book_title) + self.clean_book_title = self.escape_dirname(self.book_title) + " ({0})".format( + self.escape_dirname(", ".join(a["name"] for a in self.book_info["authors"]), clean_space=True) + ) books_dir = os.path.join(PATH, "Books") if not os.path.isdir(books_dir): @@ -657,7 +659,7 @@ def parse_html(self, root, first_page=False): return page_css, xhtml @staticmethod - def clean_dirname(dirname): + def escape_dirname(dirname, clean_space=False): if ":" in dirname: if dirname.index(":") > 30: dirname = dirname.split(":")[0] @@ -666,11 +668,11 @@ def 
clean_dirname(dirname): if ch in dirname: dirname = dirname.replace(ch, "") - return dirname + return dirname if not clean_space else dirname.replace(" ", "") def create_dirs(self): if os.path.isdir(self.BOOK_PATH): - self.display.log("Book directory already exists: %s" % self.book_title) + self.display.log("Book directory already exists: %s" % self.BOOK_PATH) else: os.makedirs(self.BOOK_PATH) From ccd5c1398a7c92f643aac6f77b1fe809831b9933 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Fri, 2 Mar 2018 09:53:38 +0100 Subject: [PATCH 037/100] Update README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 81e4f88..0045ed6 100644 --- a/README.md +++ b/README.md @@ -1,6 +1,6 @@ # SafariBooks Download and generate *EPUB* of your favorite books from [*Safari Books Online*](https://www.safaribooksonline.com) library. -Use this program only for *personal* and/or *educational* purpose. +I'm not responsible for the use of this program; it is intended only for *personal* and *educational* purposes.
## Overview: * [Requirements & Setup](#requirements--setup) From be33390f82b8a99922729e79bf324b143c3e6df9 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Fri, 2 Mar 2018 14:38:56 +0100 Subject: [PATCH 038/100] Bug fixed --- safaribooks.py | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index 4c6a2f7..2163223 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -660,9 +660,8 @@ def parse_html(self, root, first_page=False): @staticmethod def escape_dirname(dirname, clean_space=False): - if ":" in dirname: - if dirname.index(":") > 30: - dirname = dirname.split(":")[0] + if ":" in dirname and dirname.index(":") > 15: + dirname = dirname.split(":")[0] for ch in ['\\', '/', '<', '>', '`', '\'', '"', '*', '?', '|']: if ch in dirname: From 27baf7314e2af488f8b9e62784bf072e47d3b1fe Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Sat, 3 Mar 2018 12:54:36 +0100 Subject: [PATCH 039/100] Fixed bug on `escape_dirname` func for Windows users. 
--- safaribooks.py | 12 ++++++++---- 1 file changed, 8 insertions(+), 4 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index 2163223..2a8790d 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -660,12 +660,16 @@ def parse_html(self, root, first_page=False): @staticmethod def escape_dirname(dirname, clean_space=False): - if ":" in dirname and dirname.index(":") > 15: - dirname = dirname.split(":")[0] + if ":" in dirname: + if dirname.index(":") > 15: + dirname = dirname.split(":")[0] - for ch in ['\\', '/', '<', '>', '`', '\'', '"', '*', '?', '|']: + elif "win" in sys.platform: + dirname = dirname.replace(":", ",") + + for ch in ['~', '#', '%', '&', '*', '{', '}', '\\', '<', '>', '?', '/', '`', '\'', '"', '|', '+']: if ch in dirname: - dirname = dirname.replace(ch, "") + dirname = dirname.replace(ch, "_") return dirname if not clean_space else dirname.replace(" ", "") From d96679c44de70550595ec7f7e41883bf7a58ce48 Mon Sep 17 00:00:00 2001 From: Max Romanovsky Date: Thu, 8 Mar 2018 19:54:28 +0100 Subject: [PATCH 040/100] fixes for missing isbn --- safaribooks.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index 2a8790d..1412df1 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -863,7 +863,7 @@ def create_content_opf(self): for sub in self.book_info["subjects"]) return self.CONTENT_OPF.format( - (self.book_info["isbn"] if len(self.book_info["isbn"]) else self.book_id), + (self.book_info["isbn"] if (isinstance(self.book_info["isbn"], str) and len(self.book_info["isbn"])) else self.book_id), escape(self.book_title), authors, escape(self.book_info["description"]), @@ -918,7 +918,7 @@ def create_toc(self): navmap, _, max_depth = self.parse_toc(response) return self.TOC_NCX.format( - (self.book_info["isbn"] if len(self.book_info["isbn"]) else self.book_id), + (self.book_info["isbn"] if (isinstance(self.book_info["isbn"], str) and len(self.book_info["isbn"])) else self.book_id), max_depth, 
self.book_title, ", ".join(aut["name"] for aut in self.book_info["authors"]), From 18cc21485d29fe124b7d8b241daf33f0cb7108b4 Mon Sep 17 00:00:00 2001 From: Max Romanovsky Date: Fri, 9 Mar 2018 13:00:48 +0100 Subject: [PATCH 041/100] Update safaribooks.py --- safaribooks.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index 1412df1..7b0e653 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -863,7 +863,7 @@ def create_content_opf(self): for sub in self.book_info["subjects"]) return self.CONTENT_OPF.format( - (self.book_info["isbn"] if (isinstance(self.book_info["isbn"], str) and len(self.book_info["isbn"])) else self.book_id), + (self.book_info["isbn"] if self.book_info["isbn"] else self.book_id), escape(self.book_title), authors, escape(self.book_info["description"]), @@ -918,7 +918,7 @@ def create_toc(self): navmap, _, max_depth = self.parse_toc(response) return self.TOC_NCX.format( - (self.book_info["isbn"] if (isinstance(self.book_info["isbn"], str) and len(self.book_info["isbn"])) else self.book_id), + (self.book_info["isbn"] if self.book_info["isbn"] else self.book_id), max_depth, self.book_title, ", ".join(aut["name"] for aut in self.book_info["authors"]), From 5e1eca240a89ff5aeafff27db7aa8b604bce2e26 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Thu, 12 Apr 2018 20:31:17 +0200 Subject: [PATCH 042/100] Fixed #10 Fixed #11 General improvement --- safaribooks.py | 28 ++++++++++++++++------------ 1 file changed, 16 insertions(+), 12 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index 2a8790d..2bde385 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -53,6 +53,10 @@ def __init__(self, log_file): self.state_status = Value("i", 0) sys.excepthook = self.unhandled_exception + def unregister(self): + self.logger.handlers[0].close() + sys.excepthook = sys.__excepthook__ + def log(self, message): self.logger.info(str(message)) @@ -97,10 +101,10 @@ def save_last_request(self): def 
intro(self): output = self.SH_YELLOW + """ - ____ ___ _ + ____ ___ _ / __/__ _/ _/__ _____(_) - _\ \/ _ `/ _/ _ `/ __/ / - /___/\_,_/_/ \_,_/_/ /_/ + _\ \/ _ `/ _/ _ `/ __/ / + /___/\_,_/_/ \_,_/_/ /_/ / _ )___ ___ / /__ ___ / _ / _ \/ _ \/ '_/(_-< /____/\___/\___/_/\_\/___/ @@ -298,8 +302,8 @@ def __init__(self, args): self.book_title = self.book_info["title"] self.base_url = self.book_info["web_url"] - self.clean_book_title = self.escape_dirname(self.book_title) + " ({0})".format( - self.escape_dirname(", ".join(a["name"] for a in self.book_info["authors"]), clean_space=True) + self.clean_book_title = "".join(self.escape_dirname(self.book_title).split(",")[:2]) + " ({0})".format( + self.escape_dirname(", ".join(a["name"] for a in self.book_info["authors"][:2]), clean_space=True) ) books_dir = os.path.join(PATH, "Books") @@ -349,7 +353,8 @@ def __init__(self, args): if not args.no_cookies: json.dump(self.cookies, open(COOKIES_FILE, "w")) - self.display.done(self.clean_book_title + ".epub") + self.display.done(os.path.join(self.BOOK_PATH, self.book_id + ".epub")) + self.display.unregister() if not self.display.in_error and not args.log: os.remove(self.display.log_file) @@ -551,17 +556,18 @@ def link_replace(self, link): @staticmethod def get_cover(html_root): - images = html_root.xpath("//img[contains(@id, 'cover') or " + images = html_root.xpath("//img[contains(@id, 'cover') or contains(@class, 'cover') or" "contains(@name, 'cover') or contains(@src, 'cover')]") if len(images): return images[0] - divs = html_root.xpath("//div[contains(@id, 'cover') or " + divs = html_root.xpath("//div[contains(@id, 'cover') or contains(@class, 'cover') or" "contains(@name, 'cover') or contains(@src, 'cover')]//img") if len(divs): return divs[0] - a = html_root.xpath("//a[contains(@id, 'cover') or contains(@name, 'cover') or contains(@src, 'cover')]//img") + a = html_root.xpath("//a[contains(@id, 'cover') or contains(@class, 'cover') or" + "contains(@name, 'cover') or 
contains(@src, 'cover')]//img") if len(a): return a[0] @@ -945,13 +951,11 @@ def create_epub(self): ) zip_file = os.path.join(PATH, "Books", self.book_id) - if os.path.isfile(zip_file + ".epub"): - os.remove(zip_file + ".epub") if os.path.isfile(zip_file + ".zip"): os.remove(zip_file + ".zip") shutil.make_archive(zip_file, 'zip', self.BOOK_PATH) - os.rename(zip_file + ".zip", os.path.join(self.BOOK_PATH, self.clean_book_title) + ".epub") + os.rename(zip_file + ".zip", os.path.join(self.BOOK_PATH, self.book_id) + ".epub") # MAIN From a4ee173dc766efb7bbb07e7974c9962ca2af068d Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Wed, 25 Apr 2018 12:54:21 +0200 Subject: [PATCH 043/100] Fixed #12 --- safaribooks.py | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index ac07e7a..6748c40 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -302,9 +302,8 @@ def __init__(self, args): self.book_title = self.book_info["title"] self.base_url = self.book_info["web_url"] - self.clean_book_title = "".join(self.escape_dirname(self.book_title).split(",")[:2]) + " ({0})".format( - self.escape_dirname(", ".join(a["name"] for a in self.book_info["authors"][:2]), clean_space=True) - ) + self.clean_book_title = "".join(self.escape_dirname(self.book_title).split(",")[:2]) \ + + " ({0})".format(self.book_id) books_dir = os.path.join(PATH, "Books") if not os.path.isdir(books_dir): From a1c9bb94b6f668f522137857fef21704c9f5de43 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Wed, 16 May 2018 23:07:45 +0200 Subject: [PATCH 044/100] Cover image improvement --- safaribooks.py | 20 ++++++++++++-------- 1 file changed, 12 insertions(+), 8 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index 6748c40..04e8a3e 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -8,7 +8,7 @@ import argparse import requests import traceback -from lxml import html +from lxml import html, etree from html import escape from random import random from 
multiprocessing import Process, Queue, Value @@ -169,7 +169,7 @@ def api_error(response): return message -class WinQueue(list): # TODO: error while use Process in Windows: can't pickle _thread.RLock objects +class WinQueue(list): # TODO: error while use `process` in Windows: can't pickle _thread.RLock objects def put(self, el): self.append(el) @@ -555,18 +555,22 @@ def link_replace(self, link): @staticmethod def get_cover(html_root): - images = html_root.xpath("//img[contains(@id, 'cover') or contains(@class, 'cover') or" - "contains(@name, 'cover') or contains(@src, 'cover')]") + lowercase_ns = etree.FunctionNamespace(None) + lowercase_ns["lower-case"] = lambda _, n: n[0].lower() if n and len(n) else "" + + images = html_root.xpath("//img[contains(lower-case(@id), 'cover') or contains(lower-case(@class), 'cover') or" + "contains(lower-case(@name), 'cover') or contains(lower-case(@src), 'cover') or" + "contains(lower-case(@alt), 'cover')]") if len(images): return images[0] - divs = html_root.xpath("//div[contains(@id, 'cover') or contains(@class, 'cover') or" - "contains(@name, 'cover') or contains(@src, 'cover')]//img") + divs = html_root.xpath("//div[contains(lower-case(@id), 'cover') or contains(lower-case(@class), 'cover') or" + "contains(lower-case(@name), 'cover') or contains(lower-case(@src), 'cover')]//img") if len(divs): return divs[0] - a = html_root.xpath("//a[contains(@id, 'cover') or contains(@class, 'cover') or" - "contains(@name, 'cover') or contains(@src, 'cover')]//img") + a = html_root.xpath("//a[contains(lower-case(@id), 'cover') or contains(lower-case(@class), 'cover') or" + "contains(lower-case(@name), 'cover') or contains(lower-case(@src), 'cover')]//img") if len(a): return a[0] From f69ba7eedd0b87f475b041ed3c474680bab4a324 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Mon, 21 May 2018 21:34:45 +0200 Subject: [PATCH 045/100] Update README.md --- README.md | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git 
a/README.md b/README.md index 0045ed6..09ab01b 100644 --- a/README.md +++ b/README.md @@ -70,10 +70,12 @@ optional arguments: ``` The first time you'll use the program, you'll have to specify your Safari Books Online account credentials. -For the next times you'll download a book, before session expires, you can omit the credential, because the program save your session cookies in a file called `cookies.json` (see file format [`here`](/../../issues/2#issuecomment-367726544)). +For the next times you'll download a book, before session expires, you can omit the credential, because the program save your session cookies in a file called `cookies.json` (for **SSO** look file format [`here`](/../../issues/2#issuecomment-367726544)). Pay attention if you use a shared PC, because everyone that has access to your files can steal your session. -If you don't want to cache the cookies, just use the `--no-cookies` option and provide all the time your `--cred`. +If you don't want to cache the cookies, just use the `--no-cookies` option and provide all the time your `--cred`. + +You can configure proxies by setting on your system the environment variables `HTTP_PROXY` and `HTTPS_PROXY`. The program default options are thought for ensure best compatibilities for who want to export the `EPUB` to E-Readers like Amazon Kindle. If you want to do it, I suggest you to convert the `EPUB` to `AZW3` with [Calibre](https://calibre-ebook.com/). 
You can also convert the book to `MOBI` and if you'll do it with Calibre be sure to select `Ignore margins` in the conversion options: From aaa8176a7661774114a2f6a3e6e585bca3b5df62 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Mon, 21 May 2018 21:42:08 +0200 Subject: [PATCH 046/100] Added credential parser --- safaribooks.py | 107 ++++++++++++++++++++++++++++--------------------- 1 file changed, 61 insertions(+), 46 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index 04e8a3e..f155278 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -280,7 +280,7 @@ def __init__(self, args): else: self.display.info("Logging into Safari Books Online...", state=True) - self.do_login(*[c.replace("'", "").replace('"', "") for c in args.cred]) + self.do_login(*args.cred) if not args.no_cookies: json.dump(self.cookies, open(COOKIES_FILE, "w")) @@ -402,6 +402,20 @@ def requests_provider(self, url, post=False, data=None, update_cookies=True, **k return response + @staticmethod + def parse_cred(cred): + if ":" not in cred: + return False + + sep = cred.index(":") + new_cred = ["", ""] + new_cred[0] = cred[:sep].strip("'").strip('"') + if "@" not in new_cred[0]: + return False + + new_cred[1] = cred[sep + 1:] + return new_cred + def do_login(self, email, password): response = self.requests_provider(self.BASE_URL) if response == 0: @@ -962,48 +976,49 @@ def create_epub(self): # MAIN -arguments = argparse.ArgumentParser(prog="safaribooks.py", - description="Download and generate an EPUB of your favorite books" - " from Safari Books Online.", - add_help=False, - allow_abbrev=False) - -arguments.add_argument( - "--cred", metavar="", default=False, - help="Credentials used to perform the auth login on Safari Books Online." - " Es. ` --cred \"account_mail@mail.com:password01\" `." -) -arguments.add_argument( - "--no-cookies", dest="no_cookies", action='store_true', - help="Prevent your session data to be saved into `cookies.json` file." 
-) -arguments.add_argument( - "--no-kindle", dest="no_kindle", action='store_true', - help="Remove some CSS rules that block overflow on `table` and `pre` elements." - " Use this option if you're not going to export the EPUB to E-Readers like Amazon Kindle." -) -arguments.add_argument( - "--preserve-log", dest="log", action='store_true', help="Leave the `info_XXXXXXXXXXXXX.log`" - " file even if there isn't any error." -) -arguments.add_argument("--help", action="help", default=argparse.SUPPRESS, help='Show this help message.') -arguments.add_argument( - "bookid", metavar='', - help="Book digits ID that you want to download. You can find it in the URL (X-es):" - " `https://www.safaribooksonline.com/library/view/book-name/XXXXXXXXXXXXX/`" -) - -args_parsed = arguments.parse_args() - -if args_parsed.cred: - cred = args_parsed.cred.split(":") - if len(cred) != 2 or "@" not in cred[0]: - arguments.error("invalid credential: %s" % args_parsed.cred) - - args_parsed.cred = cred - -else: - if args_parsed.no_cookies: - arguments.error("invalid option: `--no-cookies` is valid only if you use the `--cred` option") - -SafariBooks(args_parsed) +if __name__ == "__main__": + arguments = argparse.ArgumentParser(prog="safaribooks.py", + description="Download and generate an EPUB of your favorite books" + " from Safari Books Online.", + add_help=False, + allow_abbrev=False) + + arguments.add_argument( + "--cred", metavar="", default=False, + help="Credentials used to perform the auth login on Safari Books Online." + " Es. ` --cred \"account_mail@mail.com:password01\" `." + ) + arguments.add_argument( + "--no-cookies", dest="no_cookies", action='store_true', + help="Prevent your session data to be saved into `cookies.json` file." + ) + arguments.add_argument( + "--no-kindle", dest="no_kindle", action='store_true', + help="Remove some CSS rules that block overflow on `table` and `pre` elements." 
+ " Use this option if you're not going to export the EPUB to E-Readers like Amazon Kindle." + ) + arguments.add_argument( + "--preserve-log", dest="log", action='store_true', help="Leave the `info_XXXXXXXXXXXXX.log`" + " file even if there isn't any error." + ) + arguments.add_argument("--help", action="help", default=argparse.SUPPRESS, help='Show this help message.') + arguments.add_argument( + "bookid", metavar='', + help="Book digits ID that you want to download. You can find it in the URL (X-es):" + " `https://www.safaribooksonline.com/library/view/book-name/XXXXXXXXXXXXX/`" + ) + + args_parsed = arguments.parse_args() + + if args_parsed.cred: + cred = SafariBooks.parse_cred(args_parsed.cred) + if not cred: + arguments.error("invalid credential: %s" % args_parsed.cred) + + args_parsed.cred = cred + + else: + if args_parsed.no_cookies: + arguments.error("invalid option: `--no-cookies` is valid only if you use the `--cred` option") + + SafariBooks(args_parsed) From b76e768c389796de1842fce525ede34a1b089f0a Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Mon, 21 May 2018 22:36:05 +0200 Subject: [PATCH 047/100] Update README.md --- README.md | 14 ++++++++++---- 1 file changed, 10 insertions(+), 4 deletions(-) diff --git a/README.md b/README.md index 09ab01b..d9cbe86 100644 --- a/README.md +++ b/README.md @@ -69,11 +69,11 @@ optional arguments: --help Show this help message. ``` -The first time you'll use the program, you'll have to specify your Safari Books Online account credentials. -For the next times you'll download a book, before session expires, you can omit the credential, because the program save your session cookies in a file called `cookies.json` (for **SSO** look file format [`here`](/../../issues/2#issuecomment-367726544)). +The first time you use the program, you'll have to specify your Safari Books Online account credentials (look [`here`](/../../issues/15) for special character). 
+The next times you'll download a book, before session expires, you can omit the credential, because the program save your session cookies in a file called `cookies.json` (for **SSO** look the file format [`here`](/../../issues/2#issuecomment-367726544)). Pay attention if you use a shared PC, because everyone that has access to your files can steal your session. -If you don't want to cache the cookies, just use the `--no-cookies` option and provide all the time your `--cred`. +If you don't want to cache the cookies, just use the `--no-cookies` option and provide all time your `--cred`. You can configure proxies by setting on your system the environment variables `HTTP_PROXY` and `HTTPS_PROXY`. @@ -106,7 +106,13 @@ In the other hand, if you're not going to export the `EPUB`, you can use the `-- [-] ISBN: 9781491958704 [-] Publishers: O'Reilly Media, Inc. [-] Rights: Copyright © O'Reilly Media, Inc. - [-] Description: By taking you through the development of a real web application from beginning to end, the second edition of this hands-on guide demonstrates the practical advantages of test-driven development (TDD) with Python. You’ll learn how to write and run tests before building each part of your app, and then develop the minimum amount of code required to pass those tests. The result? Clean code that works.In the process, you’ll learn the basics of Django, Selenium, Git, jQuery, and Mock, along with curre... + [-] Description: By taking you through the development of a real web application + from beginning to end, the second edition of this hands-on guide demonstrates the + practical advantages of test-driven development (TDD) with Python. You’ll learn + how to write and run tests before building each part of your app, and then develop + the minimum amount of code required to pass those tests. The result? Clean code + that works.In the process, you’ll learn the basics of Django, Selenium, Git, + jQuery, and Mock, along with curre... 
[-] Release Date: 2017-08-18 [-] URL: https://www.safaribooksonline.com/library/view/test-driven-development-with/9781491958698/ [*] Retrieving book chapters... From 082c7a929bc21625a144a3bb7e48fc821564b991 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Wed, 11 Jul 2018 15:36:18 +0200 Subject: [PATCH 048/100] Fixed #21 --- safaribooks.py | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index f155278..3e6ce31 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -181,7 +181,7 @@ class SafariBooks: HEADERS = { "accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8", - "accept-encoding": "gzip, deflate, br", + "accept-encoding": "gzip, deflate", "accept-language": "it-IT,it;q=0.9,en-US;q=0.8,en;q=0.7", "cache-control": "no-cache", "cookie": "", @@ -780,8 +780,7 @@ def _thread_download_css(self, url): self.display.error("Error trying to retrieve this CSS: %s\n From: %s" % (css_file, url)) with open(css_file, 'wb') as s: - for chunk in response.iter_content(1024): - s.write(chunk) + s.write(response.content) self.css_done_queue.put(1) self.display.state(len(self.css), self.css_done_queue.qsize()) From b276f67da171cd59e5de1495b5ee3ea4b4cf30b5 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Fri, 3 Aug 2018 09:57:53 +0200 Subject: [PATCH 049/100] Bug fixes --- safaribooks.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index 3e6ce31..7edec1f 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -88,7 +88,7 @@ def exit(self, error): self.out(output) self.save_last_request() - sys.exit(128) + sys.exit(1) def unhandled_exception(self, _, o, tb): self.log("".join(traceback.format_tb(tb))) @@ -523,7 +523,7 @@ def get_default_cover(self): def get_html(self, url): response = self.requests_provider(url) - if response == 0: + if response == 0 or response.status_code != 200: self.display.exit( "Crawler: error trying to 
retrieve this page: %s (%s)\n From: %s" % (self.filename, self.chapter_title, url) From 34d2cad294dd8b520bf20b8c386dd0970b7ebe1e Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Fri, 19 Oct 2018 10:01:13 +0200 Subject: [PATCH 050/100] Fixed #37 --- safaribooks.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/safaribooks.py b/safaribooks.py index 7edec1f..0067c8d 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -58,7 +58,7 @@ def unregister(self): sys.excepthook = sys.__excepthook__ def log(self, message): - self.logger.info(str(message)) + self.logger.info(str(message).encode("utf-8", "replace")) def out(self, put): sys.stdout.write("\r" + " " * self.columns + "\r" + put + "\n") From cee0a0c4dfea608a315d04bae9bccc87f1f9e53d Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Mon, 29 Oct 2018 20:36:47 +0100 Subject: [PATCH 051/100] Fix vulnerable 'requests' library --- requirements.txt | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/requirements.txt b/requirements.txt index 6964772..2666c38 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,2 +1,3 @@ lxml>=4.1.1 -requests>=2.18.4 +requests>=2.20.0 + From 5873ec80b2feedffb5f0e11c93779cf1102c4004 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Mon, 29 Oct 2018 20:41:38 +0100 Subject: [PATCH 052/100] Fix vulnerable library --- Pipfile.lock | 92 +++++++++++++++++++++++++++------------------------- 1 file changed, 47 insertions(+), 45 deletions(-) diff --git a/Pipfile.lock b/Pipfile.lock index 9d6b8e2..ee72369 100644 --- a/Pipfile.lock +++ b/Pipfile.lock @@ -5,14 +5,14 @@ }, "host-environment-markers": { "implementation_name": "cpython", - "implementation_version": "3.6.3", + "implementation_version": "3.6.5", "os_name": "posix", "platform_machine": "x86_64", "platform_python_implementation": "CPython", - "platform_release": "4.13.0-36-generic", + "platform_release": "4.15.0-36-generic", "platform_system": "Linux", - "platform_version": "#40-Ubuntu SMP 
Fri Feb 16 20:07:48 UTC 2018", - "python_full_version": "3.6.3", + "platform_version": "#39-Ubuntu SMP Mon Sep 24 16:19:09 UTC 2018", + "python_full_version": "3.6.5", "python_version": "3.6", "sys_platform": "linux" }, @@ -31,10 +31,10 @@ "default": { "certifi": { "hashes": [ - "sha256:14131608ad2fd56836d33a71ee60fa1c82bc9d2c8d98b7bdbc631fe1b3cd1296", - "sha256:edbc3f203427eef571f79a7692bb160a2b0f7ccaa31953e99bd17e307cf63f7d" + "sha256:339dc09518b07e2fa7eda5450740925974815557727d6bd35d319c1524a04a4c", + "sha256:6d58c986d22b038c8c0df30d639f23a3e6d172a05c3583e766f4c0b785c0986a" ], - "version": "==2018.1.18" + "version": "==2018.10.15" }, "chardet": { "hashes": [ @@ -45,57 +45,59 @@ }, "idna": { "hashes": [ - "sha256:8c7309c718f94b3a625cb648ace320157ad16ff131ae0af362c9f21b80ef6ec4", - "sha256:2c6a5de3089009e3da7c5dde64a141dbc8551d5b7f6cf4ed7c2568d0cc520a8f" + "sha256:156a6814fb5ac1fc6850fb002e0852d56c0c8d2531923a51032d1b70760e186e", + "sha256:684a38a6f903c1d71d6d5fac066b58d7768af4de2b832e426ec79c30daa94a16" ], - "version": "==2.6" + "version": "==2.7" }, "lxml": { "hashes": [ - "sha256:41f59cbdab232f11680d5d4dec9f2e6782fd24d78e37ee833447702e34e675f4", - "sha256:e7e41d383f19bab9d57f5f3b18d158655bcd682e7e723f441b9e183e1e35a6b5", - "sha256:155521c337acecf8202091cff85bb9f709f238130ebadf04280fb1db11f5ad8b", - "sha256:d2c985d2460b81c6ca5feb8b86f1bc594ad59405d0bdf68626b85852b701553c", - "sha256:950e63387514aa1b881eba5ac6cb2ec51a118b3dafe99dd80ca19d8fb0142f30", - "sha256:470d7ce41e8047208ba1a376560bad17f1468df1f3097bc83902b26cfafdbb0c", - "sha256:e608839a5ee2180164424ccf279c8e2d9bbe8816d002c58fd97d6b621ba4aa94", - "sha256:87a66bcadac270fc010cb029022a93fc722bf1204a8b03e782d4c790f0edf7ca", - "sha256:2dedfeeecc2d5a939cf622602f5a1ce443ca82407f386880f739f1a9f08053ad", - "sha256:ba05732e4bcf59e948f61588851dcf620fd60d5bbd9d704203e5f59bbaa60219", - "sha256:2190266059fec3c5a55f9d6c30532c64c6d414d3228909c0af573fe4907e78d1", - 
"sha256:dd291debfaa535d9cb6cee8d7aca2328775e037d02d13f1634e57f49bc302cc4", - "sha256:29a36e354c39b2e24bc4ee103de53417ebb80f976a6ab9e8d093d559e2ac03e1", - "sha256:e37427d5a27eefbcfc48847e0b37f348113fac7280bc857421db39ffc6372570", - "sha256:b106d4d2383382399ad82108fd187e92f40b1c90f55c2d36bbcb1c44bcf940fc", - "sha256:0ee07da52d240f1dc3c83eef5cd5f1b7f018226c1121f2a54d446645779a6d17", - "sha256:3b33549fb8f91b38a7500078242b03cca513f3412a2cdae722e89bf83f95971d", - "sha256:4c12e90886d9c53ab434c8d0cebea122321cce19614c3c6b6d1a7700d7cc6212", - "sha256:79322000279cda10b53c374d53ca632ead3bc51c6aebf8e62c8fa93a4d08b750", - "sha256:6cba398eb37e0631e60e0e080c101cfe91769b2c8267105b64b4625e2581ea21", - "sha256:49a655956f8de69e1258bc0fcfc43eb3bd1e038655784d77d1869b4b81444e37", - "sha256:af8a5373241d09b8fc53e0490e1719ce5dc90a21b19db89b6596c1adcdd52270", - "sha256:e6b6698415c7e8d227a47a3b1038e1b37c2b438a1b48c2db7ad9e74ddbcd1149", - "sha256:155c916cf2645b4a8f2bd5d09065e92d1b67b8d464bdc001e0b524af84bedf6f", - "sha256:fa7320679ced5e25b20203d157280680fc84eb783b6cc650cb0c98e1858b7dd3", - "sha256:4187c4b0cefc3353181db048c51f42c489d9ac51e40b86c4851dc0671372971d", - "sha256:d5d29663e979e83b3fc361e97200f959cddb3a14797391d15273d84a5a8ae44b", - "sha256:940caef1ec7c78e0c34b0f6b94fe42d0f2022915ffc78643d28538a5cfd0f40e" + "sha256:fa39ea60d527fbdd94215b5e5552f1c6a912624521093f1384a491a8ad89ad8b", + "sha256:ae07fa0c115733fce1e9da96a3ac3fa24801742ca17e917e0c79d63a01eeb843", + "sha256:caf0e50b546bb60dfa99bb18dfa6748458a83131ecdceaf5c071d74907e7e78a", + "sha256:abf181934ac3ef193832fb973fd7f6149b5c531903c2ec0f1220941d73eee601", + "sha256:62939a8bb6758d1bf923aa1c13f0bcfa9bf5b2fc0f5fa917a6e25db5fe0cfa4e", + "sha256:4815892904c336bbaf73dafd54f45f69f4021c22b5bad7332176bbf4fb830568", + "sha256:81992565b74332c7c1aff6a913a3e906771aa81c9d0c68c68113cffcae45bc53", + "sha256:02bc220d61f46e9b9d5a53c361ef95e9f5e1d27171cd461dddb17677ae2289a5", + "sha256:bccb267678b870d9782c3b44d0cefe3ba0e329f9af8c946d32bf3778e7a4f271", 
+ "sha256:2f31145c7ff665b330919bfa44aacd3a0211a76ca7e7b441039d2a0b0451e415", + "sha256:aab09fbe8abfa3b9ce62aaf45aca2d28726b1b9ee44871dbe644050a2fff4940", + "sha256:b9c78242219f674ab645ec571c9a95d70f381319a23911941cd2358a8e0521cf", + "sha256:a623965c086a6e91bb703d4da62dabe59fe88888e82c4117d544e11fd74835d6", + "sha256:9d862e3cf4fc1f2837dedce9c42269c8c76d027e49820a548ac89fdcee1e361f", + "sha256:5be031b0f15ad63910d8e5038b489d95a79929513b3634ad4babf77100602588", + "sha256:75830c06a62fe7b8fe3bbb5f269f0b308f19f3949ac81cfd40062f47c1455faf", + "sha256:a7783ab7f6a508b0510490cef9f857b763d796ba7476d9703f89722928d1e113", + "sha256:e16e07a0ec3a75b5ee61f2b1003c35696738f937dc8148fbda9fe2147ccb6e61", + "sha256:438a1b0203545521f6616132bfe0f4bca86f8a401364008b30e2b26ec408ce85", + "sha256:8c892fb0ee52c594d9a7751c7d7356056a9682674b92cc1c4dc968ff0f30c52f", + "sha256:c4df4d27f4c93b2cef74579f00b1d3a31a929c7d8023f870c4b476f03a274db4", + "sha256:22f253b542a342755f6cfc047fe4d3a296515cf9b542bc6e261af45a80b8caf6", + "sha256:e175a006725c7faadbe69e791877d09936c0ef2cf49d01b60a6c1efcb0e8be6f", + "sha256:edd9c13a97f6550f9da2236126bb51c092b3b1ce6187f2bd966533ad794bbb5e", + "sha256:dbbd5cf7690a40a9f0a9325ab480d0fccf46d16b378eefc08e195d84299bfae1", + "sha256:db0d213987bcd4e6d41710fb4532b22315b0d8fb439ff901782234456556aed1", + "sha256:60842230678674cdac4a1cf0f707ef12d75b9a4fc4a565add4f710b5fcf185d5", + "sha256:5c93ae37c3c588e829b037fdfbd64a6e40c901d3f93f7beed6d724c44829a3ad", + "sha256:d3266bd3ac59ac4edcd5fa75165dee80b94a3e5c91049df5f7c057ccf097551c", + "sha256:36720698c29e7a9626a0dc802ef8885f8f0239bfd1689628ecd459a061f2807f" ], - "version": "==4.1.1" + "version": "==4.2.5" }, "requests": { "hashes": [ - "sha256:6a1b267aa90cac58ac3a765d067950e7dbbf75b1da07e895d1f594193a40a38b", - "sha256:9c443e7324ba5b85070c4a818ade28bfabedf16ea10206da1132edaa6dda237e" + "sha256:a84b8c9ab6239b578f22d1c21d51b696dcfe004032bb80ea832398d6909d7279", + "sha256:99dcfdaaeb17caf6e526f32b6a7b780461512ab3f1d992187801694cba42770c" 
], - "version": "==2.18.4" + "version": "==2.20.0" }, "urllib3": { "hashes": [ - "sha256:06330f386d6e4b195fbfc736b297f58c5a892e4440e54d294d7004e3a9bbea1b", - "sha256:cc44da8e1145637334317feebd728bd869a35285b93cbb4cca2577da7e62db4f" + "sha256:8819bba37a02d143296a4d032373c4dd4aca11f6d4c9973335ca75f9c8475f59", + "sha256:41c3db2fc01e5b907288010dec72f9d0a74e37d6994e6eb56849f59fea2265ae" ], - "version": "==1.22" + "version": "==1.24" } }, "develop": {} From a90362fd287f88d7fe316d0aa7206516fa4649c2 Mon Sep 17 00:00:00 2001 From: Krzysztof Barczynski Date: Mon, 3 Dec 2018 20:40:42 -0600 Subject: [PATCH 053/100] Fixed login url --- safaribooks.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/safaribooks.py b/safaribooks.py index 0067c8d..46720bc 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -417,7 +417,7 @@ def parse_cred(cred): return new_cred def do_login(self, email, password): - response = self.requests_provider(self.BASE_URL) + response = self.requests_provider("https://www.safaribooksonline.com/accounts/login") if response == 0: self.display.exit("Login: unable to reach Safari Books Online. Try again...") From 65b9e4b140003eaf24f72301200f918e2a6a5b0c Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Tue, 4 Dec 2018 11:36:50 +0100 Subject: [PATCH 054/100] Update safaribooks.py Reuse global variable --- safaribooks.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/safaribooks.py b/safaribooks.py index 46720bc..d6b6df9 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -417,7 +417,7 @@ def parse_cred(cred): return new_cred def do_login(self, email, password): - response = self.requests_provider("https://www.safaribooksonline.com/accounts/login") + response = self.requests_provider(self.LOGIN_URL) if response == 0: self.display.exit("Login: unable to reach Safari Books Online. 
Try again...") From 6d8f222279eb9151e73f627fb47ce273d1c1f596 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Thu, 3 Jan 2019 14:30:14 +0100 Subject: [PATCH 055/100] Fixed #51 Fixed #56 Fixed #58 Fixed #59 Fixed #61 --- safaribooks.py | 63 ++++++++++++++++++++++++++------------------------ 1 file changed, 33 insertions(+), 30 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index d6b6df9..1f96b94 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -18,6 +18,10 @@ PATH = os.path.dirname(os.path.realpath(__file__)) COOKIES_FILE = os.path.join(PATH, "cookies.json") +SAFARI_BASE_HOST = "learning.oreilly.com" +SAFARI_BASE_URL = "https://" + SAFARI_BASE_HOST + + class Display: BASE_FORMAT = logging.Formatter( @@ -145,11 +149,11 @@ def state(self, origin, done): ) def done(self, epub_file): - self.info("Done: %s\n\n" + self.info("Done: %s\n\n" % epub_file + " If you like it, please * this project on GitHub to make it known:\n" " https://github.com/lorenzodifuccia/safaribooks\n" " e don't forget to renew your Safari Books Online subscription:\n" - " https://www.safaribooksonline.com/signup/\n\n" % epub_file + + " " + SAFARI_BASE_URL + "\n\n" + self.SH_BG_RED + "[!]" + self.SH_DEFAULT + " Bye!!") @staticmethod @@ -158,7 +162,7 @@ def api_error(response): if "detail" in response and "Not found" in response["detail"]: message += "book's not present in Safari Books Online.\n" \ " The book identifier is the digits that you can find in the URL:\n" \ - " `https://www.safaribooksonline.com/library/view/book-name/XXXXXXXXXXXXX/`" + " `" + SAFARI_BASE_URL + "/library/view/book-name/XXXXXXXXXXXXX/`" else: os.remove(COOKIES_FILE) @@ -179,6 +183,9 @@ def qsize(self): class SafariBooks: + LOGIN_URL = SAFARI_BASE_URL + "/accounts/login/" + API_TEMPLATE = SAFARI_BASE_URL + "/api/v1/book/{0}/" + HEADERS = { "accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8", "accept-encoding": "gzip, deflate", @@ -186,16 +193,13 @@ class 
SafariBooks: "cache-control": "no-cache", "cookie": "", "pragma": "no-cache", - "referer": "https://www.safaribooksonline.com/home/", + "origin": SAFARI_BASE_URL, + "referer": LOGIN_URL, "upgrade-insecure-requests": "1", - "user-agent": "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) " - "Chrome/62.0.3202.94 Safari/537.36" + "user-agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) " + "Chrome/60.0.3112.113 Safari/537.36" } - BASE_URL = "https://www.safaribooksonline.com" - LOGIN_URL = BASE_URL + "/accounts/login/" - API_TEMPLATE = BASE_URL + "/api/v1/book/{0}/" - BASE_01_HTML = "\n" \ "" # Format: ID, Depth, Title, Author, NAVMAP - TOC_NCX = "" \ + TOC_NCX = "\n" \ "" \ - "" \ - "" \ - "" \ - "" \ - "" \ - "" \ - "" \ - "{2}" \ - "{3}" \ - "{4}" \ + " \"http://www.daisy.org/z3986/2005/ncx-2005-1.dtd\">\n" \ + "\n" \ + "\n" \ + "\n" \ + "\n" \ + "\n" \ + "\n" \ + "\n" \ + "{2}\n" \ + "{3}\n" \ + "{4}\n" \ "" def __init__(self, args): @@ -364,7 +368,7 @@ def return_cookies(self): return " ".join(["{0}={1};".format(k, v) for k, v in self.cookies.items()]) def return_headers(self, url): - if "safaribooksonline" in urlsplit(url).netloc: + if SAFARI_BASE_HOST in urlsplit(url).netloc: self.HEADERS["cookie"] = self.return_cookies() else: @@ -441,10 +445,9 @@ def do_login(self, email, password): self.LOGIN_URL, post=True, data=( - ("csrfmiddlewaretoken", ""), ("csrfmiddlewaretoken", csrf), + ("csrfmiddlewaretoken", csrf), ("email", email), ("password1", password), - ("is_login_form", "true"), ("leaveblank", ""), - ("dontchange", "http://") + ("login", "Sign In"), ("next", "") ), allow_redirects=False ) @@ -531,7 +534,7 @@ def get_html(self, url): root = None try: - root = html.fromstring(response.text, base_url=self.BASE_URL) + root = html.fromstring(response.text, base_url=SAFARI_BASE_URL) except (html.etree.ParseError, html.etree.ParserError) as parsing_error: self.display.error(parsing_error) @@ -591,7 +594,7 
@@ def get_cover(html_root): return None def parse_html(self, root, first_page=False): - if random() > 0.5: + if random() > 0.8: if len(root.xpath("//div[@class='controls']/a/text()")): self.display.exit(self.display.api_error(" ")) @@ -798,7 +801,7 @@ def _thread_download_images(self, url): self.display.images_ad_info.value = 1 else: - response = self.requests_provider(urljoin(self.BASE_URL, url), + response = self.requests_provider(urljoin(SAFARI_BASE_URL, url), update_cookies=False, stream=True) if response == 0: @@ -1004,7 +1007,7 @@ def create_epub(self): arguments.add_argument( "bookid", metavar='', help="Book digits ID that you want to download. You can find it in the URL (X-es):" - " `https://www.safaribooksonline.com/library/view/book-name/XXXXXXXXXXXXX/`" + " `" + SAFARI_BASE_URL + "/library/view/book-name/XXXXXXXXXXXXX/`" ) args_parsed = arguments.parse_args() From acee92ddbe636c03e3750beb1cc118f2a56eea0c Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Thu, 3 Jan 2019 14:48:09 +0100 Subject: [PATCH 056/100] PEP8 and working for #57 --- safaribooks.py | 11 +++++------ 1 file changed, 5 insertions(+), 6 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index 1f96b94..c066ffd 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -22,7 +22,6 @@ SAFARI_BASE_URL = "https://" + SAFARI_BASE_HOST - class Display: BASE_FORMAT = logging.Formatter( fmt="[%(asctime)s] %(message)s", @@ -229,7 +228,7 @@ class SafariBooks: "" # Format: ID, Title, Authors, Description, Subjects, Publisher, Rights, Date, CoverId, MANIFEST, SPINE, CoverUrl - CONTENT_OPF = "\n" \ + CONTENT_OPF = "\n" \ "\n" \ "\n"\ @@ -253,7 +252,7 @@ class SafariBooks: "" # Format: ID, Depth, Title, Author, NAVMAP - TOC_NCX = "\n" \ + TOC_NCX = "\n" \ "\n" \ "\n" \ @@ -1013,11 +1012,11 @@ def create_epub(self): args_parsed = arguments.parse_args() if args_parsed.cred: - cred = SafariBooks.parse_cred(args_parsed.cred) - if not cred: + parsed_cred = SafariBooks.parse_cred(args_parsed.cred) + if 
not parsed_cred: arguments.error("invalid credential: %s" % args_parsed.cred) - args_parsed.cred = cred + args_parsed.cred = parsed_cred else: if args_parsed.no_cookies: From 5de40909e0543e1bf43eae3cb88ea53fe6946a43 Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Fri, 4 Jan 2019 14:46:30 +0100 Subject: [PATCH 057/100] Update README.md --- README.md | 1 + 1 file changed, 1 insertion(+) diff --git a/README.md b/README.md index d9cbe86..dc6f458 100644 --- a/README.md +++ b/README.md @@ -1,6 +1,7 @@ # SafariBooks Download and generate *EPUB* of your favorite books from [*Safari Books Online*](https://www.safaribooksonline.com) library. I'm not responsible for the use of this program, this is only for *personal* and *educational* purpose. +Before any usage please read the *O'Reilly*'s [Terms of Service](https://learning.oreilly.com/terms/). ## Overview: * [Requirements & Setup](#requirements--setup) From a238dee1be79d2d0df6aa6414b77afe2a06bd1cb Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Wed, 13 Feb 2019 23:38:42 +0100 Subject: [PATCH 058/100] Fix #16 --- safaribooks.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/safaribooks.py b/safaribooks.py index c066ffd..dae5cd5 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -61,10 +61,10 @@ def unregister(self): sys.excepthook = sys.__excepthook__ def log(self, message): - self.logger.info(str(message).encode("utf-8", "replace")) + self.logger.info(message.encode("utf-8", "replace")) def out(self, put): - sys.stdout.write("\r" + " " * self.columns + "\r" + put + "\n") + sys.stdout.write("\r" + " " * self.columns + "\r" + put.encode("utf-8", "replace") + "\n") def info(self, message, state=False): self.log(message) From 9938473f06b2dd3c729baf803df31bc233d9bece Mon Sep 17 00:00:00 2001 From: Lorenzo Di Fuccia Date: Wed, 13 Feb 2019 23:47:43 +0100 Subject: [PATCH 059/100] Fixes #63 and #64 --- safaribooks.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git 
a/safaribooks.py b/safaribooks.py index dae5cd5..2d64982 100644 --- a/safaribooks.py +++ b/safaribooks.py @@ -208,10 +208,11 @@ class SafariBooks: "\n" \ "{0}\n" \ "