SHA1
--- a/.gitignore
+++ b/.gitignore
@@ -58,3 +58,5 @@ docs/_build/
 
				 # PyBuilder
			
 
				 target/
			
 
				 
			
 
				+__init__.py
			
 
				+
			
--- a/daemon_process.py
+++ b/daemon_process.py
@@ -0,0 +1,33 @@
 
				+#!/usr/bin/env python
			
 
				+
			
 
				+import json
			
 
				+from notify import notify
			
 
				+from time import sleep
			
 
				+import os
			
 
				+
			
 
				+os.system('./run_spider.sh')
			
 
				+
			
 
				+with open('./date.json') as json_data:
			
 
				+    file_content = json.load(json_data)
			
 
				+
			
 
				+curr_date = file_content[0]['date']
			
 
				+
			
 
				+
			
 
				+while True:
			
 
				+    os.system('./run_spider.sh')
			
 
				+    with open('./date.json') as json_data:
			
 
				+        file_content = json.load(json_data)
			
 
				+
			
 
				+    new_date = file_content[0]['date']
			
 
				+
			
 
				+    if new_date != curr_date:
			
 
				+        notify(new_date)
			
 
				+        curr_date = new_date
			
 
				+
			
 
				+    # Sleep for 30 min.
			
 
				+    #
			
 
				+    sleep(1800)
			
 
				+
			
 
				+
			
 
				+# EOF
			
 
				+# vim: set tabstop=4 shiftwidth=4 expandtab :
			
--- a/date.json
+++ b/date.json
@@ -0,0 +1,3 @@
 
				+[
			
 
				+{"date": "2018-06-04"}
			
 
				+]
			
--- a/driver_spider.py
+++ b/driver_spider.py
@@ -0,0 +1,61 @@
 
				+#!/usr/bin/env python
			
 
				+
			
 
				+import scrapy
			
 
				+import re
			
 
				+
			
 
				+
			
 
				+class LoginSpider(scrapy.Spider):
			
 
				+    name = 'uk-driver-spider'
			
 
				+    login_url = 'https://driverpracticaltest.direct.gov.uk/login'
			
 
				+    core_url = 'https://driverpracticaltest.direct.gov.uk'
			
 
				+    start_urls = [login_url]
			
 
				+
			
 
				+    def parse(self, response):
			
 
				+
			
 
				+        # Get username and password.
			
 
				+        #
			
 
				+        with open('./username', 'r') as f:
			
 
				+            username = f.read()
			
 
				+        with open('./password', 'r') as f:
			
 
				+            password = f.read()
			
 
				+
			
 
				+        self.logger.info('\nUSER {}PASS {}'.format(username, password))
			
 
				+        return scrapy.FormRequest.from_response(
			
 
				+            response,
			
 
				+            formdata={'username': username, 'password': password},
			
 
				+            callback=self.after_login
			
 
				+        )
			
 
				+
			
 
				+    def after_login(self, response):
			
 
				+        # Check login succeed before going on.
			
 
				+        #
			
 
				+        if 'authentication failed' in response.body:
			
 
				+            self.logger.error('Login failed')
			
 
				+            return
			
 
				+
			
 
				+        # Obtain the csrftoken.
			
 
				+        #
			
 
				+        href_w_token = response.xpath('//a[@id="date-time-change"]').extract()
			
 
				+        token = re.search(r'csrftoken=[\w]+', str(href_w_token)).group(0).split('=')[1]
			
 
				+        self.logger.info(token)
			
 
				+
			
 
				+        url = self.core_url + response.xpath('//a[@id="date-time-change"]/@href').extract_first()
			
 
				+        self.logger.info(url)
			
 
				+
			
 
				+        yield scrapy.Request(url, callback=self.after_change)
			
 
				+
			
 
				+    def after_change(self, response):
			
 
				+        return scrapy.FormRequest.from_response(
			
 
				+            response,
			
 
				+            callback=self.parse_calendar
			
 
				+        )
			
 
				+
			
 
				+    def parse_calendar(self, response):
			
 
				+        earliest_date = response.xpath('//td[contains(@class, "bookable")]//a/@href').extract_first()[6:]
			
 
				+
			
 
				+        yield{
			
 
				+            'date': earliest_date
			
 
				+        }
			
 
				+
			
 
				+# EOF
			
 
				+# vim: set tabstop=4 shiftwidth=4 expandtab :
			
--- a/email_login
+++ b/email_login
--- a/email_password
+++ b/email_password
--- a/notify.py
+++ b/notify.py
@@ -0,0 +1,22 @@
 
				+#!/usr/bin/env python
			
 
				+
			
 
				+
			
 
				+def notify(message):
			
 
				+
			
 
				+    import smtplib
			
 
				+
			
 
				+    with open('./email_login', 'r') as f:
			
 
				+        username = f.read()
			
 
				+    with open('./email_password', 'r') as f:
			
 
				+        password = f.read()
			
 
				+    with open('./send_to', 'r') as f:
			
 
				+        send_to = f.read()
			
 
				+
			
 
				+    server = smtplib.SMTP('smtp.gmail.com', 587)
			
 
				+    server.starttls()
			
 
				+    server.login(username, password)
			
 
				+    server.sendmail(username, send_to, message)
			
 
				+    server.quit()
			
 
				+
			
 
				+# EOF
			
 
				+# vim: set tabstop=4 shiftwidth=4 expandtab :
			
--- a/password
+++ b/password
--- a/run_spider.sh
+++ b/run_spider.sh
@@ -0,0 +1,8 @@
 
				+#!/usr/bin/env bash
			
 
				+
			
 
				+rm ./date.json
			
 
				+scrapy runspider ./driver_spider.py -o ./date.json
			
 
				+
			
 
				+
			
 
				+# EOF
			
 
				+# vim: set tabstop=4 shiftwidth=4 expandtab :
			
--- a/send_to
+++ b/send_to
Auteur	SHA1 Message	Date
Kirill Kupriyanov	dad2688deb Use calendar to retrieve the earliest date.	il y a 6 ans
Kirill Kupriyanov	718393b0a5 Edit gitignore to ignore __init__.py.	il y a 6 ans
Kirill Kupriyanov	99bcfc3873 Web spider for retrieving earliest date.	il y a 6 ans
Kirill Kupriyanov	1aa2433409 Email login and password security files.	il y a 6 ans
Kirill Kupriyanov	5d7af2a08a Username, password security files.	il y a 6 ans