amititash
diff --git a/‎furnstyl/furnstyl.py
+50 b/‎furnstyl/furnstyl.py
+50
diff --git a/‎furnstyl/furnstyl.pyc
2.14 KB b/‎furnstyl/furnstyl.pyc
2.14 KB
diff --git a/‎kwaldecal.py
+63 b/‎kwaldecal.py
+63
diff --git a/‎kwaldecal.pyc
2.3 KB b/‎kwaldecal.pyc
2.3 KB
diff --git a/‎kwaldecal/13_kwd.py
+63 b/‎kwaldecal/13_kwd.py
+63
diff --git a/‎kwaldecal/13_kwd.pyc
2.34 KB b/‎kwaldecal/13_kwd.pyc
2.34 KB
diff --git a/‎kwaldecal/14_kwd.py
+63 b/‎kwaldecal/14_kwd.py
+63
diff --git a/‎kwaldecal/14_kwd.pyc
2.34 KB b/‎kwaldecal/14_kwd.pyc
2.34 KB
diff --git a/‎kwaldecal/15_kwd.py
+63 b/‎kwaldecal/15_kwd.py
+63
diff --git a/‎kwaldecal/15_kwd.pyc
2.35 KB b/‎kwaldecal/15_kwd.pyc
2.35 KB
diff --git a/‎kwaldecal/16_kwd.py
+63 b/‎kwaldecal/16_kwd.py
+63
diff --git a/‎kwaldecal/16_kwd.pyc
2.34 KB b/‎kwaldecal/16_kwd.pyc
2.34 KB
@@ -0,0 +1,50 @@
+
+import scrapy
+import logging
+from scrapy.contrib.spiders import Rule
+from scrapy.contrib.linkextractors.sgml import SgmlLinkExtractor
+from scrapy.selector import HtmlXPathSelector
+
+from scrapy import Request, Spider
+from scrapy.exceptions import CloseSpider
+from scrapy.selector import Selector
+
+
+from scrapy.item import Item, Field
+
+class ScrapySampleItem(Item):  # one scraped product page of the furnstyl spider
+    title = Field()  # text of the first <h1> on the product page
+    link = Field()  # URL of the product page (response.url)
+    desc = Field()  # list of serialized description nodes; falls back to the <h1> text when none match
+    price =  Field()  # first node matching ".price", serialized (markup, not just the number)
+    image = Field()  # src attribute of the first ".cloud-zoom img" node
+    
+    
+class StackOverflowSpider(scrapy.Spider):
+    """Crawl the furnstyl.com furniture listing and emit one item per product.
+
+    ``parse`` follows every product link found on the listing page and
+    ``parse_product`` turns each product page into a ``ScrapySampleItem``.
+    """
+
+    name = 'furnstyl'
+    start_urls = ['http://www.furnstyl.com/furniture']
+
+    def parse(self, response):
+        """Yield a request for every product linked from the listing page.
+
+        Links are the ``href`` attributes of nodes carrying the
+        ``product-image`` class, resolved against the page URL.
+        """
+        for href in response.css('.product-image::attr(href)').extract():
+            yield scrapy.Request(response.urljoin(href),
+                                 callback=self.parse_product)
+
+    def parse_product(self, response):
+        """Yield a single ``ScrapySampleItem`` built from a product page."""
+        item = ScrapySampleItem()
+
+        item['title'] = response.css('h1::text').extract_first()
+        item['image'] = response.css('.cloud-zoom img::attr(src)').extract_first()
+        item['desc'] = response.css('div[id="product_tabs_description_contents"] .std').extract()
+        item['price'] = response.css('.price').extract_first()
+
+        if not item['desc']:
+            # No description nodes on this page: log which page it was and
+            # fall back to the title text (same ``h1::text`` value as above).
+            # The message text is kept unchanged so existing log searches
+            # still match; only the URL is appended.
+            # NOTE(review): the fallback makes ``desc`` a string (or None)
+            # here but a list otherwise - confirm consumers accept both.
+            self.logger.info("EMPTY RECIEVED: %s", response.url)
+            item['desc'] = item['title']
+        item['link'] = response.url
+
+        yield item
@@ -0,0 +1,63 @@
+
+import scrapy
+import logging
+from scrapy.contrib.spiders import Rule
+from scrapy.contrib.linkextractors.sgml import SgmlLinkExtractor
+from scrapy.selector import HtmlXPathSelector
+
+from scrapy import Request, Spider
+from scrapy.exceptions import CloseSpider
+from scrapy.selector import Selector
+
+
+from scrapy.item import Item, Field
+
+
+URL = 'http://kcwalldecals.com/21-ethnic-indian?p={page}'  # listing URL template; start_requests fills {page} with the page number
+
+
+
+class ScrapySampleItem(Item):  # one scraped product page of the kwaldecal spider
+    title = Field()  # text of the first <h1> on the product page
+    link = Field()  # URL of the product page (response.url)
+    desc = Field()  # list of serialized <p> nodes inside div#short_description_content (may be empty)
+    image = Field()  # src attribute of the img#bigpic node
+
+
+
+class StackOverflowSpider(scrapy.Spider):
+    """Crawl the paginated kcwalldecals.com listing addressed by ``URL``.
+
+    Listing pages 1 through ``last_page`` are requested; every product link
+    on them is followed and each product page yields one
+    ``ScrapySampleItem``.
+    """
+
+    # Let 404 responses reach the callbacks instead of being dropped by
+    # Scrapy's HTTP-error filtering.
+    handle_httpstatus_list = [404]
+    # NOTE(review): the other *_kwd.py spiders added alongside this one use
+    # the same name; Scrapy expects spider names to be unique per project.
+    name = "kwaldecal"
+    # Number of the last listing page to request (pages start at 1).
+    last_page = 2
+
+    def start_requests(self):
+        """Yield one request per listing page, 1 through ``last_page``."""
+        # int() because a value supplied as a spider argument
+        # (``-a last_page=N``) arrives as a string.
+        for page in range(1, int(self.last_page) + 1):
+            yield Request(URL.format(page=page))
+
+    def parse(self, response):
+        """Yield a request for every product linked from a listing page.
+
+        Links are the ``href`` attributes of nodes carrying the
+        ``product_img_link`` class, resolved against the page URL.
+        """
+        for href in response.css('.product_img_link::attr(href)').extract():
+            yield scrapy.Request(response.urljoin(href),
+                                 callback=self.parse_product)
+
+    def parse_product(self, response):
+        """Yield a single ``ScrapySampleItem`` built from a product page."""
+        item = ScrapySampleItem()
+
+        item['title'] = response.css('h1::text').extract_first()
+        item['image'] = response.css('img[id="bigpic"]::attr(src)').extract_first()
+        item['desc'] = response.css('div[id="short_description_content"] p').extract()
+
+        if not item['desc']:
+            # The item is still emitted; the log line records which page had
+            # no description. Message text is kept unchanged so existing log
+            # searches still match; only the URL is appended.
+            self.logger.info("EMPTY RECIEVED: %s", response.url)
+
+        item['link'] = response.url
+
+        yield item
+				
@@ -0,0 +1,63 @@
+
+import scrapy
+import logging
+from scrapy.contrib.spiders import Rule
+from scrapy.contrib.linkextractors.sgml import SgmlLinkExtractor
+from scrapy.selector import HtmlXPathSelector
+
+from scrapy import Request, Spider
+from scrapy.exceptions import CloseSpider
+from scrapy.selector import Selector
+
+
+from scrapy.item import Item, Field
+
+
+URL = 'http://kcwalldecals.com/13-birds-animals?p={page}'  # listing URL template; start_requests fills {page} with the page number
+
+
+
+class ScrapySampleItem(Item):  # one scraped product page of the kwaldecal spider
+    title = Field()  # text of the first <h1> on the product page
+    link = Field()  # URL of the product page (response.url)
+    desc = Field()  # list of serialized <p> nodes inside div#short_description_content (may be empty)
+    image = Field()  # src attribute of the img#bigpic node
+
+
+
+class StackOverflowSpider(scrapy.Spider):
+    """Crawl the paginated kcwalldecals.com listing addressed by ``URL``.
+
+    Listing pages 1 through ``last_page`` are requested; every product link
+    on them is followed and each product page yields one
+    ``ScrapySampleItem``.
+    """
+
+    # Let 404 responses reach the callbacks instead of being dropped by
+    # Scrapy's HTTP-error filtering.
+    handle_httpstatus_list = [404]
+    # NOTE(review): the other kwaldecal spiders added alongside this one use
+    # the same name; Scrapy expects spider names to be unique per project.
+    name = "kwaldecal"
+    # Number of the last listing page to request (pages start at 1).
+    last_page = 8
+
+    def start_requests(self):
+        """Yield one request per listing page, 1 through ``last_page``."""
+        # int() because a value supplied as a spider argument
+        # (``-a last_page=N``) arrives as a string.
+        for page in range(1, int(self.last_page) + 1):
+            yield Request(URL.format(page=page))
+
+    def parse(self, response):
+        """Yield a request for every product linked from a listing page.
+
+        Links are the ``href`` attributes of nodes carrying the
+        ``product_img_link`` class, resolved against the page URL.
+        """
+        for href in response.css('.product_img_link::attr(href)').extract():
+            yield scrapy.Request(response.urljoin(href),
+                                 callback=self.parse_product)
+
+    def parse_product(self, response):
+        """Yield a single ``ScrapySampleItem`` built from a product page."""
+        item = ScrapySampleItem()
+
+        item['title'] = response.css('h1::text').extract_first()
+        item['image'] = response.css('img[id="bigpic"]::attr(src)').extract_first()
+        item['desc'] = response.css('div[id="short_description_content"] p').extract()
+
+        if not item['desc']:
+            # The item is still emitted; the log line records which page had
+            # no description. Message text is kept unchanged so existing log
+            # searches still match; only the URL is appended.
+            self.logger.info("EMPTY RECIEVED: %s", response.url)
+
+        item['link'] = response.url
+
+        yield item
+				
@@ -0,0 +1,63 @@
+
+import scrapy
+import logging
+from scrapy.contrib.spiders import Rule
+from scrapy.contrib.linkextractors.sgml import SgmlLinkExtractor
+from scrapy.selector import HtmlXPathSelector
+
+from scrapy import Request, Spider
+from scrapy.exceptions import CloseSpider
+from scrapy.selector import Selector
+
+
+from scrapy.item import Item, Field
+
+
+URL = 'http://kcwalldecals.com/14-modern-graphics?p={page}'  # listing URL template; start_requests fills {page} with the page number
+
+
+
+class ScrapySampleItem(Item):  # one scraped product page of the kwaldecal spider
+    title = Field()  # text of the first <h1> on the product page
+    link = Field()  # URL of the product page (response.url)
+    desc = Field()  # list of serialized <p> nodes inside div#short_description_content (may be empty)
+    image = Field()  # src attribute of the img#bigpic node
+
+
+
+class StackOverflowSpider(scrapy.Spider):
+    """Crawl the paginated kcwalldecals.com listing addressed by ``URL``.
+
+    Listing pages 1 through ``last_page`` are requested; every product link
+    on them is followed and each product page yields one
+    ``ScrapySampleItem``.
+    """
+
+    # Let 404 responses reach the callbacks instead of being dropped by
+    # Scrapy's HTTP-error filtering.
+    handle_httpstatus_list = [404]
+    # NOTE(review): the other kwaldecal spiders added alongside this one use
+    # the same name; Scrapy expects spider names to be unique per project.
+    name = "kwaldecal"
+    # Number of the last listing page to request (pages start at 1).
+    last_page = 12
+
+    def start_requests(self):
+        """Yield one request per listing page, 1 through ``last_page``."""
+        # int() because a value supplied as a spider argument
+        # (``-a last_page=N``) arrives as a string.
+        for page in range(1, int(self.last_page) + 1):
+            yield Request(URL.format(page=page))
+
+    def parse(self, response):
+        """Yield a request for every product linked from a listing page.
+
+        Links are the ``href`` attributes of nodes carrying the
+        ``product_img_link`` class, resolved against the page URL.
+        """
+        for href in response.css('.product_img_link::attr(href)').extract():
+            yield scrapy.Request(response.urljoin(href),
+                                 callback=self.parse_product)
+
+    def parse_product(self, response):
+        """Yield a single ``ScrapySampleItem`` built from a product page."""
+        item = ScrapySampleItem()
+
+        item['title'] = response.css('h1::text').extract_first()
+        item['image'] = response.css('img[id="bigpic"]::attr(src)').extract_first()
+        item['desc'] = response.css('div[id="short_description_content"] p').extract()
+
+        if not item['desc']:
+            # The item is still emitted; the log line records which page had
+            # no description. Message text is kept unchanged so existing log
+            # searches still match; only the URL is appended.
+            self.logger.info("EMPTY RECIEVED: %s", response.url)
+
+        item['link'] = response.url
+
+        yield item
+				
@@ -0,0 +1,63 @@
+
+import scrapy
+import logging
+from scrapy.contrib.spiders import Rule
+from scrapy.contrib.linkextractors.sgml import SgmlLinkExtractor
+from scrapy.selector import HtmlXPathSelector
+
+from scrapy import Request, Spider
+from scrapy.exceptions import CloseSpider
+from scrapy.selector import Selector
+
+
+from scrapy.item import Item, Field
+
+
+URL = 'http://kcwalldecals.com/15-nature-wall-decals?p={page}'  # listing URL template; start_requests fills {page} with the page number
+
+
+
+class ScrapySampleItem(Item):  # one scraped product page of the kwaldecal spider
+    title = Field()  # text of the first <h1> on the product page
+    link = Field()  # URL of the product page (response.url)
+    desc = Field()  # list of serialized <p> nodes inside div#short_description_content (may be empty)
+    image = Field()  # src attribute of the img#bigpic node
+
+
+
+class StackOverflowSpider(scrapy.Spider):
+    """Crawl the paginated kcwalldecals.com listing addressed by ``URL``.
+
+    Listing pages 1 through ``last_page`` are requested; every product link
+    on them is followed and each product page yields one
+    ``ScrapySampleItem``.
+    """
+
+    # Let 404 responses reach the callbacks instead of being dropped by
+    # Scrapy's HTTP-error filtering.
+    handle_httpstatus_list = [404]
+    # NOTE(review): the other kwaldecal spiders added alongside this one use
+    # the same name; Scrapy expects spider names to be unique per project.
+    name = "kwaldecal"
+    # Number of the last listing page to request (pages start at 1).
+    last_page = 6
+
+    def start_requests(self):
+        """Yield one request per listing page, 1 through ``last_page``."""
+        # int() because a value supplied as a spider argument
+        # (``-a last_page=N``) arrives as a string.
+        for page in range(1, int(self.last_page) + 1):
+            yield Request(URL.format(page=page))
+
+    def parse(self, response):
+        """Yield a request for every product linked from a listing page.
+
+        Links are the ``href`` attributes of nodes carrying the
+        ``product_img_link`` class, resolved against the page URL.
+        """
+        for href in response.css('.product_img_link::attr(href)').extract():
+            yield scrapy.Request(response.urljoin(href),
+                                 callback=self.parse_product)
+
+    def parse_product(self, response):
+        """Yield a single ``ScrapySampleItem`` built from a product page."""
+        item = ScrapySampleItem()
+
+        item['title'] = response.css('h1::text').extract_first()
+        item['image'] = response.css('img[id="bigpic"]::attr(src)').extract_first()
+        item['desc'] = response.css('div[id="short_description_content"] p').extract()
+
+        if not item['desc']:
+            # The item is still emitted; the log line records which page had
+            # no description. Message text is kept unchanged so existing log
+            # searches still match; only the URL is appended.
+            self.logger.info("EMPTY RECIEVED: %s", response.url)
+
+        item['link'] = response.url
+
+        yield item
+				
@@ -0,0 +1,63 @@
+
+import scrapy
+import logging
+from scrapy.contrib.spiders import Rule
+from scrapy.contrib.linkextractors.sgml import SgmlLinkExtractor
+from scrapy.selector import HtmlXPathSelector
+
+from scrapy import Request, Spider
+from scrapy.exceptions import CloseSpider
+from scrapy.selector import Selector
+
+
+from scrapy.item import Item, Field
+
+
+URL = 'http://kcwalldecals.com/16-kids-decals?p={page}'  # listing URL template; start_requests fills {page} with the page number
+
+
+
+class ScrapySampleItem(Item):  # one scraped product page of the kwaldecal spider
+    title = Field()  # text of the first <h1> on the product page
+    link = Field()  # URL of the product page (response.url)
+    desc = Field()  # list of serialized <p> nodes inside div#short_description_content (may be empty)
+    image = Field()  # src attribute of the img#bigpic node
+
+
+
+class StackOverflowSpider(scrapy.Spider):
+    """Crawl the paginated kcwalldecals.com listing addressed by ``URL``.
+
+    Listing pages 1 through ``last_page`` are requested; every product link
+    on them is followed and each product page yields one
+    ``ScrapySampleItem``.
+    """
+
+    # Let 404 responses reach the callbacks instead of being dropped by
+    # Scrapy's HTTP-error filtering.
+    handle_httpstatus_list = [404]
+    # NOTE(review): the other kwaldecal spiders added alongside this one use
+    # the same name; Scrapy expects spider names to be unique per project.
+    name = "kwaldecal"
+    # Number of the last listing page to request (pages start at 1).
+    last_page = 6
+
+    def start_requests(self):
+        """Yield one request per listing page, 1 through ``last_page``."""
+        # int() because a value supplied as a spider argument
+        # (``-a last_page=N``) arrives as a string.
+        for page in range(1, int(self.last_page) + 1):
+            yield Request(URL.format(page=page))
+
+    def parse(self, response):
+        """Yield a request for every product linked from a listing page.
+
+        Links are the ``href`` attributes of nodes carrying the
+        ``product_img_link`` class, resolved against the page URL.
+        """
+        for href in response.css('.product_img_link::attr(href)').extract():
+            yield scrapy.Request(response.urljoin(href),
+                                 callback=self.parse_product)
+
+    def parse_product(self, response):
+        """Yield a single ``ScrapySampleItem`` built from a product page."""
+        item = ScrapySampleItem()
+
+        item['title'] = response.css('h1::text').extract_first()
+        item['image'] = response.css('img[id="bigpic"]::attr(src)').extract_first()
+        item['desc'] = response.css('div[id="short_description_content"] p').extract()
+
+        if not item['desc']:
+            # The item is still emitted; the log line records which page had
+            # no description. Message text is kept unchanged so existing log
+            # searches still match; only the URL is appended.
+            self.logger.info("EMPTY RECIEVED: %s", response.url)
+
+        item['link'] = response.url
+
+        yield item
+