@fabianvf
Created April 13, 2015 15:28
import os
import json

from scrapi.processing.base import BaseProcessor


class StorageProcessor(BaseProcessor):
    NAME = 'storage'

    def process_raw(self, raw):
        # Write the raw document to archive/<source>/<docID>/raw.<filetype>
        filename = 'archive/{}/{}/raw.{}'.format(raw['source'], raw['docID'], raw['filetype'])
        if not os.path.exists(os.path.dirname(filename)):
            os.makedirs(os.path.dirname(filename))
        with open(filename, 'w') as f:
            f.write(json.dumps(raw.attributes, indent=4))

    def process_normalized(self, raw, normalized):
        # Write the normalized document to archive/<source>/<docID>/normalized.json
        filename = 'archive/{}/{}/normalized.json'.format(raw['source'], raw['docID'])
        if not os.path.exists(os.path.dirname(filename)):
            os.makedirs(os.path.dirname(filename))
        with open(filename, 'w') as f:
            f.write(json.dumps(normalized.attributes, indent=4))
@brianjgeiger

You just have to add this to scrapi/processing/storage.py, and update your local.py to include 'storage' in the RAW_PROCESSING and NORMALIZED_PROCESSING lists:

NORMALIZED_PROCESSING = ['storage'] 
RAW_PROCESSING = ['storage']
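
With those settings, each harvested document should be written under archive/<source>/<docID>/. A minimal sketch of reading one back, assuming a hypothetical docID (12345) for the biomed source mentioned below:

import json

# Hypothetical path: the actual source/docID directories depend on what was harvested
with open('archive/biomed/12345/normalized.json') as f:
    normalized_doc = json.load(f)
print(normalized_doc)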

@walkerh

walkerh commented Apr 13, 2015

invoke harvester biomed
