summary | refs | log | tree | commit | diff
path: root/scripts/crawler/tbc_web_crawler/spiders/items.py
diff options
context:
space:
mode:
Diffstat (limited to 'scripts/crawler/tbc_web_crawler/spiders/items.py')
-rw-r--r-- scripts/crawler/tbc_web_crawler/spiders/items.py | 18
1 files changed, 18 insertions, 0 deletions
diff --git a/scripts/crawler/tbc_web_crawler/spiders/items.py b/scripts/crawler/tbc_web_crawler/spiders/items.py
new file mode 100644
index 0000000..9dda20f
--- /dev/null
+++ b/scripts/crawler/tbc_web_crawler/spiders/items.py
@@ -0,0 +1,18 @@
+import scrapy
+
+
+class TbcErrorItems(scrapy.Item):
+ # Scrapy item declaring five fields. The per-field notes below are read off
+ # the names only -- TODO confirm against the spider that populates this item.
+ chapter_name = scrapy.Field()  # presumably the name of the chapter
+ chapter_urls = scrapy.Field()  # presumably the URL(s) of that chapter
+ completed_book_urls = scrapy.Field()  # presumably the URL(s) of the completed book
+ number_of_errors = scrapy.Field()  # presumably a count of the errors found
+ error_messages = scrapy.Field()  # presumably the text of those errors
+
+
+
+class TbcBrokenItems(scrapy.Item):
+ # Scrapy item declaring two fields; meanings inferred from names -- TODO confirm.
+ broken_url = scrapy.Field()  # presumably the URL that could not be fetched
+ broken_status = scrapy.Field()  # presumably the status (e.g. HTTP code) seen for it