Browse Source

Move SitemapItem class into generator.spiders.sitemap_file

This will solve the following issue:

ImportError: No module named sitemap.generator

Change-Id: I449f0fb0c87613c36447cca94f4f5857f3d31afa
tags/1.2.1
Christian Berendt 3 years ago
parent
commit
92a4fb6527
2 changed files with 10 additions and 23 deletions
  1. 0
    21
      sitemap/generator/items.py
  2. 10
    2
      sitemap/generator/spiders/sitemap_file.py

+ 0
- 21
sitemap/generator/items.py View File

@@ -1,21 +0,0 @@
# Licensed under the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License. You may obtain
# a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
# License for the specific language governing permissions and limitations
# under the License.

import scrapy


class SitemapItem(scrapy.item.Item):
'''Class to represent an item in the sitemap.'''
loc = scrapy.item.Field()
lastmod = scrapy.item.Field()
priority = scrapy.item.Field()
changefreq = scrapy.item.Field()

+ 10
- 2
sitemap/generator/spiders/sitemap_file.py View File

@@ -13,9 +13,17 @@
import time
import urlparse

from scrapy import item
from scrapy.linkextractors import LinkExtractor
from scrapy import spiders
from sitemap.generator import items


class SitemapItem(item.Item):
'''Class to represent an item in the sitemap.'''
loc = item.Field()
lastmod = item.Field()
priority = item.Field()
changefreq = item.Field()


class SitemapSpider(spiders.CrawlSpider):
@@ -68,7 +76,7 @@ class SitemapSpider(spiders.CrawlSpider):
self.start_urls.append(url)

def parse_item(self, response):
item = items.SitemapItem()
item = SitemapItem()
item['loc'] = response.url

path = urlparse.urlsplit(response.url).path

Loading…
Cancel
Save